# Two sample sequences; they first differ at index 1 (3 versus 2).
a, b = [1, 3, 3], [1, 2, 2]

# Lists compare lexicographically, so the first differing pair decides the
# order.  Both expressions below evaluate to True.
(a < b) == False
(b < a) == True

我希望列表中的值是函数。在 a 和 b 的例子中,index = 2 处的值(即函数)不应被求值,因为 index = 1 处的值(a[1]==3, b[1]==2)已足以确定 b < a。




def lex_comp(a, b):
    """Lexicographically compare two sequences of zero-argument callables.

    The callables are invoked pairwise, left to right, and only until the
    first pair whose results differ, so later (possibly expensive) callables
    are never evaluated once the order is decided.

    Args:
        a: Iterable of zero-argument callables.
        b: Iterable of zero-argument callables, compared position by position
            with ``a``.

    Returns:
        -1 if ``a`` orders before ``b``, +1 if it orders after, and 0 if every
        compared pair produced equal results.  Only the common prefix is
        compared; surplus items of the longer input are ignored.
    """
    # zip() pairs up the callables without calling them, so evaluation stays
    # lazy; it also avoids depending on the Python 2-only itertools.izip.
    for func_a, func_b in zip(a, b):
        v_a = func_a()
        v_b = func_b()
        if v_a < v_b:
            return -1
        # The "greater" test must mirror the "less" test above; repeating the
        # same condition would make +1 unreachable.
        if v_a > v_b:
            return +1
    return 0

# Stand-in callables for the example: the first pair yields equal results,
# the second pair differs (1 versus 2).
def foo1():
    return 1


def foo2():
    return 1


def bar1():
    return 1


def bar2():
    return 2


# Placeholders: the bodies are left as "...".
def func1():
    return ...


def func2():
    return ...


# The trailing "..." presumably marks where further entries would go.
list_a = [foo1, bar1, func1, ...]
list_b = [foo2, bar2, func2, ...]

# Now the comparator can be used, for instance, to sort a list of these lists.
# There is no builtin named ``sort``; ``sorted`` accepts the comparator through
# its Python 2 ``cmp`` keyword (on Python 3 pass
# ``key=functools.cmp_to_key(lex_comp)`` instead).
sorted_lists = sorted([list_a, list_b], cmp=lex_comp)

import itertools

def f(a, x):
    """Announce that a lazy value is being computed, then return it.

    Args:
        a: Label identifying the value; interpolated into the printed message.
        x: The value to hand back unchanged.

    Returns:
        ``x``.
    """
    # Parenthesised single-argument form: prints the same text under the
    # Python 2 print statement and the Python 3 print function.
    print("lazy eval of {}".format(a))
    return x

# Three rows of deferred values: each entry is a zero-argument lambda that
# calls f(label, value) only when invoked.  Row a carries the values
# (1, 3, 3); rows b and c both carry (1, 2, 2) under different labels.
a = [
    lambda: f('a', 1),
    lambda: f('b', 3),
    lambda: f('c', 3),
]
b = [
    lambda: f('d', 1),
    lambda: f('e', 2),
    lambda: f('f', 2),
]
c = [
    lambda: f('g', 1),
    lambda: f('h', 2),
    lambda: f('i', 2),
]

def lazyCmpList(a, b):
    """Compare two lists of zero-argument callables lexicographically.

    Callables are invoked pairwise, left to right, each at most once, and
    evaluation stops at the first pair whose results differ.

    Args:
        a: List of zero-argument callables.
        b: List of zero-argument callables, compared position by position
            with ``a``.

    Returns:
        -1, 0 or +1, following the ``cmp`` convention.  Only the common prefix
        is compared, so lists of unequal length whose shared positions are all
        equal compare as 0.
    """
    # zip() only pairs the callables up; nothing is evaluated until the loop
    # body calls them.
    for func_a, func_b in zip(a, b):
        x, y = func_a(), func_b()
        if x != y:
            # Same -1 / +1 result that cmp(x, y) gives, without relying on the
            # Python 2-only builtin.
            return (x > y) - (x < y)
    return 0

# Show the comparison result for each pairing.  The parenthesised
# single-argument form prints identically on Python 2 and Python 3.
print(lazyCmpList(a, b))
print(lazyCmpList(b, a))
print(lazyCmpList(b, c))


lazy eval of a
lazy eval of d
lazy eval of b
lazy eval of e
lazy eval of d
lazy eval of a
lazy eval of e
lazy eval of b
lazy eval of d
lazy eval of g
lazy eval of e
lazy eval of h
lazy eval of f
lazy eval of i

请注意,这段代码假定两个函数列表的长度相同。它可以扩展为支持长度不等的列表,但你必须先定义相应的逻辑,例如:cmp([f1, f2, f3], [f1, f2, f3, f1]) 应该返回什么?



>>> def f(x):
...   return 2**x
>>> def g(x):
...   return x*2
>>> [f(x) for x in range(1,10)]
[2, 4, 8, 16, 32, 64, 128, 256, 512]
>>> [g(x) for x in range(1,10)]
[2, 4, 6, 8, 10, 12, 14, 16, 18]
>>> zipped = zip((f(i) for i in range(1,10)),(g(i) for i in range(1,10)))
>>> x,y = next(itertools.dropwhile(lambda t: t[0]==t[1],zipped))
>>> x > y
True
>>> x < y
False
>>> x
8
>>> y
6

import random
import itertools
import functools

# Benchmark input: num_rows rows of 10 random integers drawn from {0, 1, 2}.
# range() replaces the Python 2-only xrange(); both loops are short, so the
# list that range() builds on Python 2 is negligible.
num_rows = 100
data = [[random.randint(0, 2) for _ in range(10)] for _ in range(num_rows)]

# Turn data values into functions.
def return_func(value):
    """Return ``value`` unchanged.

    Wrapped with ``functools.partial`` elsewhere in this file so that each
    data value becomes a zero-argument callable.
    """
    return value

# Mirror of ``data`` in which every integer is wrapped in a zero-argument
# callable that returns it.
list_funcs = [
    [functools.partial(return_func, cell) for cell in values]
    for values in data
]

def lazy_cmp_FujiApple(a, b):
    """Compare two lists of zero-argument callables using ``takewhile``.

    Counts the leading positions at which both callables return equal values,
    then compares the results at the first differing position.

    Args:
        a: List of zero-argument callables.
        b: List of zero-argument callables; expected to have the same length
            as ``a``.

    Returns:
        0 if every position of ``a`` matched, otherwise -1 or +1 following the
        ``cmp`` convention for the first differing position.
    """
    # itertools.izip exists only on Python 2; the builtin zip is its lazy
    # equivalent on Python 3.
    lazy_zip = getattr(itertools, 'izip', zip)
    # takewhile stops at the first mismatch, so callables past that point are
    # never invoked.  The intermediate list exists only to be counted.
    l = len(list(itertools.takewhile(
        lambda pair: pair[0]() == pair[1](), lazy_zip(a, b))))
    if l == len(a):
        return 0
    # This return must sit outside the ``if``; nested under ``return 0`` it is
    # unreachable.  The pair at index l is evaluated a second time here because
    # takewhile discarded its results.
    x, y = a[l](), b[l]()
    # Equivalent to cmp(x, y) without the Python 2-only builtin.
    return (x > y) - (x < y)

sorted1 = sorted(list_funcs, lazy_cmp_FujiApple)
%timeit sorted(list_funcs, lazy_cmp_FujiApple)
# 100 loops, best of 3: 2.77 ms per loop

def lex_comp_mine(a, b):
    """Compare two sequences of zero-argument callables with a plain loop.

    Callables are invoked pairwise, left to right, each at most once, and the
    loop returns as soon as one pair of results differs.

    Args:
        a: Iterable of zero-argument callables.
        b: Iterable of zero-argument callables, compared position by position
            with ``a``.

    Returns:
        -1 if ``a`` orders before ``b``, +1 if it orders after, and 0 if every
        compared pair produced equal results.
    """
    # itertools.izip exists only on Python 2; the builtin zip is its lazy
    # equivalent on Python 3.
    lazy_zip = getattr(itertools, 'izip', zip)
    for func_a, func_b in lazy_zip(a, b):
        v_a = func_a()
        v_b = func_b()
        if v_a < v_b:
            return -1
        if v_a > v_b:
            return +1
    return 0

# Sort with the plain-loop comparator, then time the same call.  %timeit is an
# IPython magic, so that line only runs inside IPython.
sorted2 = sorted(list_funcs, cmp=lex_comp_mine)
%timeit sorted(list_funcs, cmp=lex_comp_mine)
# 1000 loops, best of 3: 930 µs per loop

def lazy_comp_juanpa(a, b):
    """Compare two lists of zero-argument callables using ``dropwhile``.

    The callables are turned into a lazy stream of result pairs; ``dropwhile``
    skips the equal pairs and the first differing pair decides the order.
    Each callable is invoked at most once.

    Args:
        a: Iterable of zero-argument callables.
        b: Iterable of zero-argument callables, compared position by position
            with ``a``.

    Returns:
        -1, 0 or +1, following the ``cmp`` convention; 0 when every compared
        pair is equal.
    """
    # itertools.izip exists only on Python 2; the builtin zip is its lazy
    # equivalent on Python 3.
    lazy_zip = getattr(itertools, 'izip', zip)
    # Compare what the callables return, not the callable objects themselves;
    # the generator keeps evaluation lazy.
    values = ((func_a(), func_b()) for func_a, func_b in lazy_zip(a, b))
    # The (0, 0) default covers the all-equal case, where dropwhile yields
    # nothing and a bare next() would raise StopIteration.
    x, y = next(itertools.dropwhile(lambda t: t[0] == t[1], values), (0, 0))
    # Equivalent to cmp(x, y) without the Python 2-only builtin.
    return (x > y) - (x < y)

sorted3 = sorted(list_funcs, cmp=lazy_comp_juanpa)
%timeit sorted(list_funcs, cmp=lex_comp_mine)
# 1000 loops, best of 3: 949 µs per loop

# Baseline: the builtin sort applied directly to the raw integer rows.
%timeit sorted(data)
# 10000 loops, best of 3: 45.4 µs per loop

# Optional sanity check, left disabled.  The sorted1/sorted2 rows hold
# callables, so each one is invoked to show its value.
# NOTE(review): sorted3 rows hold callables as well, so printing it directly
# would show the callable objects rather than their values.
# print sorted(data)
# print [[c() for c in row] for row in sorted1]
# print [[c() for c in row] for row in sorted2]
# print sorted3

我猜创建中间列表损害了 @FujiApple 版本的性能。在原始 data 列表上运行各比较器版本,并将运行时间与 Python 原生的列表排序进行比较时,我注意到我的版本慢了大约 10 倍(每次循环 501 µs 对 45.4 µs)。我想,要接近 Python 原生实现的性能并不容易……