Skip to content

Commit 4a5fd88

Browse files
committed
update Merge k sorted lists
1 parent cbf775e commit 4a5fd88

2 files changed

Lines changed: 241 additions & 0 deletions

File tree

SUMMARY.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,6 +46,7 @@
4646
* [Reverse Linked List](linked_list/reverse_linked_list.md)
4747
* [Reverse Linked List II](linked_list/reverse_linked_list_ii.md)
4848
* [Merge Two Sorted Lists](linked_list/merge_two_sorted_lists.md)
49+
* [Merge k Sorted Lists](linked_list/merge_k_sorted_lists.md)
4950
* [Sort List](linked_list/sort_list.md)
5051
* [Reorder List](linked_list/reorder_list.md)
5152
* [Reverse - 翻转法](reverse/README.md)
Lines changed: 240 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,240 @@
1+
# Merge k Sorted Lists
2+
3+
## Source
4+
5+
- leetcode: [Merge k Sorted Lists | LeetCode OJ](https://leetcode.com/problems/merge-k-sorted-lists/)
6+
- lintcode: [(104) Merge k Sorted Lists](http://www.lintcode.com/en/problem/merge-k-sorted-lists/)
7+
8+
## 题解1 - 选择归并(TLE) <i class="fa fa-thumbs-o-down"></i>
9+
10+
参考 [Merge Two Sorted Lists | Data Structure and Algorithm](http://algorithm.yuanbin.me/linked_list/merge_two_sorted_lists.html) 中对两个有序链表的合并方法,这里我们也可以采用从 k 个链表中选择其中最小值的节点链接到`lastNode->next`(和选择排序思路有点类似),同时该节点所在的链表表头节点往后递推一个。直至`lastNode`遍历完 k 个链表的所有节点,此时表头节点均为`NULL`, 返回`dummy->next`.
11+
12+
这种方法非常简单直接,但是时间复杂度较高,容易出现 TLE.
13+
14+
### C++
15+
16+
```c++
17+
/**
18+
* Definition of ListNode
19+
* class ListNode {
20+
* public:
21+
* int val;
22+
* ListNode *next;
23+
* ListNode(int val) {
24+
* this->val = val;
25+
* this->next = NULL;
26+
* }
27+
* }
28+
*/
29+
30+
class Solution {
31+
public:
32+
/**
33+
* @param lists: a list of ListNode
34+
* @return: The head of one sorted list.
35+
*/
36+
ListNode *mergeKLists(vector<ListNode *> &lists) {
37+
if (lists.empty()) {
38+
return NULL;
39+
}
40+
41+
ListNode *dummy = new ListNode(INT_MAX);
42+
ListNode *last = dummy;
43+
44+
while (true) {
45+
int count = 0;
46+
int index = -1, tempVal = INT_MAX;
47+
for (int i = 0; i != lists.size(); ++i) {
48+
if (NULL == lists[i]) {
49+
++count;
50+
if (count == lists.size()) {
51+
last->next = NULL;
52+
return dummy->next;
53+
}
54+
continue;
55+
}
56+
57+
// choose the min value in non-NULL ListNode
58+
if (NULL != lists[i] && lists[i]->val <= tempVal) {
59+
tempVal = lists[i]->val;
60+
index = i;
61+
}
62+
}
63+
64+
last->next = lists[index];
65+
last = last->next;
66+
lists[index] = lists[index]->next;
67+
}
68+
}
69+
};
70+
```
71+
72+
### 源码分析
73+
74+
1. 由于头节点不定,我们使用`dummy`节点。
75+
2. 使用`last`表示每次归并后的新链表末尾节点。
76+
3. `count`用于累计链表表头节点为`NULL`的个数,若与 vector 大小相同则代表所有节点均已遍历完。
77+
4. `tempVal`用于保存每次比较 vector 中各链表表头节点中的最小值,`index`保存本轮选择归并过程中最小值对应的链表索引,用于循环结束前递推该链表表头节点。
78+
79+
### 复杂度分析
80+
81+
由于每次`for`循环只能选择出一个最小值,总的时间复杂度最坏情况下为 $$O(k \cdot \sum ^{k}_{i=1}l_i)$$. 空间复杂度近似为 $$O(1)$$.
82+
83+
## 题解2 - 迭代调用`Merge Two Sorted Lists`(TLE) <i class="fa fa-thumbs-o-down"></i>
84+
85+
鉴于题解1时间复杂度较高,题解2中我们可以反复利用时间复杂度相对较低的 [Merge Two Sorted Lists | Data Structure and Algorithm](http://algorithm.yuanbin.me/linked_list/merge_two_sorted_lists.html). 即先合并链表1和2,接着将合并后的新链表再与链表3合并,如此反复直至 vector 内所有链表均已完全合并[^soulmachine]
86+
87+
### C++
88+
89+
```c++
90+
/**
91+
* Definition of ListNode
92+
* class ListNode {
93+
* public:
94+
* int val;
95+
* ListNode *next;
96+
* ListNode(int val) {
97+
* this->val = val;
98+
* this->next = NULL;
99+
* }
100+
* }
101+
*/
102+
103+
class Solution {
104+
public:
105+
/**
106+
* @param lists: a list of ListNode
107+
* @return: The head of one sorted list.
108+
*/
109+
ListNode *mergeKLists(vector<ListNode *> &lists) {
110+
if (lists.empty()) {
111+
return NULL;
112+
}
113+
114+
ListNode *head = lists[0];
115+
for (int i = 1; i != lists.size(); ++i) {
116+
head = merge2Lists(head, lists[i]);
117+
}
118+
119+
return head;
120+
}
121+
122+
private:
123+
ListNode *merge2Lists(ListNode *left, ListNode *right) {
124+
ListNode *dummy = new ListNode(0);
125+
ListNode *last = dummy;
126+
127+
while (NULL != left && NULL != right) {
128+
if (left->val < right->val) {
129+
last->next = left;
130+
left = left->next;
131+
} else {
132+
last->next = right;
133+
right = right->next;
134+
}
135+
last = last->next;
136+
}
137+
138+
last->next = (NULL != left) ? left : right;
139+
140+
return dummy->next;
141+
}
142+
};
143+
```
144+
145+
### 源码分析
146+
147+
实现合并两个链表的子方法后就没啥难度了,`mergeKLists`中左半部分链表初始化为`lists[0]`, `for`循环后迭代归并`head`和`lists[i]`.
148+
149+
### 复杂度分析
150+
151+
合并两个链表时最差时间复杂度为 $$O(l_1+l_2)$$, 那么在以上的实现中总的时间复杂度可近似认为是 $$l_1 + l_1+l_2 +...+l_1+l_2+...+l_k = O(\sum _{i=1} ^{k} (k-i) \cdot l_i)$$. 比起题解1复杂度是要小一点,但量级上仍然差不太多。实际运行时间也证明了这一点,题解2的运行时间差不多时题解1的一半。那么还有没有进一步降低时间复杂度的可能呢?当然是有的,且看下题分解...
152+
153+
## 题解3 - 二分调用`Merge Two Sorted Lists`
154+
155+
题解2中`merge2Lists`优化空间不大,那咱们就来看看`mergeKLists`中的`for`循环,仔细观察可得知第`i`个链表 $$l_i$$ 被遍历了 $$k-i$$ 次,如果我们使用二分法对其进行归并呢?从中间索引处进行二分归并后,每个链表参与合并的次数变为 $$\log k$$, 故总的时间复杂度可降至 $$\log k \cdot \sum _{i=1} ^{k} l_i$$. 优化幅度较大。
156+
157+
### C++
158+
159+
```c++
160+
/**
161+
* Definition of ListNode
162+
* class ListNode {
163+
* public:
164+
* int val;
165+
* ListNode *next;
166+
* ListNode(int val) {
167+
* this->val = val;
168+
* this->next = NULL;
169+
* }
170+
* }
171+
*/
172+
173+
class Solution {
174+
public:
175+
/**
176+
* @param lists: a list of ListNode
177+
* @return: The head of one sorted list.
178+
*/
179+
ListNode *mergeKLists(vector<ListNode *> &lists) {
180+
if (lists.empty()) {
181+
return NULL;
182+
}
183+
184+
return helper(lists, 0, lists.size() - 1);
185+
}
186+
187+
private:
188+
ListNode *helper(vector<ListNode *> &lists, int start, int end) {
189+
if (start == end) {
190+
return lists[start];
191+
} else if (start + 1 == end) {
192+
return merge2Lists(lists[start], lists[end]);
193+
}
194+
195+
ListNode *left = helper(lists, start, start + (end - start) / 2);
196+
ListNode *right = helper(lists, start + (end - start) / 2 + 1, end);
197+
198+
return merge2Lists(left, right);
199+
}
200+
201+
ListNode *merge2Lists(ListNode *left, ListNode *right) {
202+
ListNode *dummy = new ListNode(0);
203+
ListNode *last = dummy;
204+
205+
while (NULL != left && NULL != right) {
206+
if (left->val < right->val) {
207+
last->next = left;
208+
left = left->next;
209+
} else {
210+
last->next = right;
211+
right = right->next;
212+
}
213+
last = last->next;
214+
}
215+
last->next = (NULL != left) ? left : right;
216+
217+
return dummy->next;
218+
}
219+
};
220+
```
221+
222+
### 源码分析
223+
224+
由于需要建立二分递归模型,另建一私有方法`helper`引入起止位置较为方便。下面着重分析`helper`
225+
226+
1. 分两种边界条件处理,分别是`start == end``start + 1 == end`. 虽然第二种边界条件可以略去,但是加上会节省递归调用的栈空间。
227+
2. 使用分治思想理解`helper`, `left``right`的边界处理建议先分析几个简单例子,做到不重不漏。
228+
3. 注意`merge2Lists`中传入的参数,为`lists[start]`而不是`start`...
229+
230+
`mergeKLists`中调用`helper`时传入的`end`参数为`lists.size() - 1`,而不是`lists.size()`.
231+
232+
### 复杂度分析
233+
234+
题解中已分析过,最坏的时间复杂度为 $$\log k \cdot \sum _{i=1} ^{k} l_i$$, 空间复杂度近似为 $$O(1)$$.
235+
236+
优化后的运行时间显著减少!由题解2中的500+ms 减至40ms 以内。
237+
238+
## Reference
239+
240+
- [^soulmachine]: [soulmachine的LeetCode 题解](../docs/leetcode-cpp.pdf)

0 commit comments

Comments
 (0)