在列表中查找和排序平均值

时间:2014-03-22 18:56:21

标签: python average

我有一个制表符分隔的文本文件,格式如下:

TITLE   FSAL
Professor   "30,000.00"
Professor   0
Staff   "90,000.00"
Professor   "50,000.00"
Manager "80,000.00"
Professor   "40,000.00"

我的目标是按最高平均工资对职称进行排名。我到目前为止的代码是:

from collections import Counter
job_file = open("jobs.txt", "r")

headers = job_file.readline()
titles = []
salaries = []

for line in job_file.readlines():
  line.rstrip()
  (title, fsal) = line.split('\t')
  #convert fsal from string to float,
  fsal = float(fsal.replace('"', '').replace(',', ''))

  titles.append(title)
  salaries.append(fsal)

#Average salary for all titles
avg_salary = sum(salaries)/len(titles)
print "Average salary for all titles = ", avg_salary
#Average salary for all titles =  48333.3333333

我可以做什么来按职位名称输出平均工资,以便我可以使用.sort()按最高平均工资对其进行排名,即:

average salary for Professor = 30000.0  #(30000.0 + 0.0 + 50000.0 + 40000.0)/4
average salary for Staff = 90000.0  #90000.0/1
average salary for Manager = 80000.0  #80000.0/1

最终输出应如下所示:

1. Staff 90000.0
2. Manager 80000.0
3. Professor 30000.0

1 个答案:

答案 0 :(得分:0)

#!/usr/bin/python
import collections
Job = collections.namedtuple('Job', ['title', 'salary'])
all_jobs = []
with open("jobs.txt", "r") as job_file:
    headers = job_file.readline()
    for line in job_file:
        (title, fsal) = line.rstrip().split('\t')
        fsal = float(fsal.replace('"', '').replace(',', ''))
        all_jobs.append(Job(title, fsal))
avg_salary = sum(
    job.salary for job in all_jobs) / len(all_jobs)
print "Average salary for all titles = ", avg_salary
sorted_jobs = sorted(
    all_jobs, key=lambda job: job.salary, reverse=True)
for i, j in enumerate(sorted_jobs):
    print '%i. %s \t%g' % (i + 1, j.title, j.salary)

编辑:OP想要每个职位的平均值:

#!/usr/bin/python
import collections
Job = collections.namedtuple('Job', ['title', 'salary'])
salaries = {}
with open("jobs.txt", "r") as job_file:
    headers = job_file.readline()
    for line in job_file:
        (title, fsal) = line.rstrip().split('\t')
        fsal = float(fsal.replace('"', '').replace(',', ''))
        if title in salaries:
            salaries[title].append(fsal)
        else:
            salaries[title] = [fsal]
average = lambda alist: sum(alist) / len(alist)
average_salaries = [Job(title, average(salaries[title]))
                    for title in salaries]
sorted_salaries = sorted(
    average_salaries, key=lambda job: job.salary, reverse=True)
for i, j in enumerate(sorted_salaries):
    print '%i. %s \t%g' % (i + 1, j.title, j.salary)