如何使用 Python 脚本仅从 JSON API 接收选定序列号的数据

时间:2019-04-19 03:26:54

标签: python json web-scraping prometheus

如何只接收选定序列号的数据,或者添加一个要排除的序列号列表?例如 "serialNumber": "121718037628" 这台设备已经失效约 2 个月了。或者,能否利用 "lastReportDate": 1549920259 自动排除长时间未更新的数据?

使用普罗米修斯抓取元数据

来自 Enphase 微型逆变器控制器(Envoy)的数据如下所示,地址为 http://envoy/api/v1/production/inverters(本地网络):

[
  {
    "serialNumber": "121718037628",
    "lastReportDate": 1549920259,
    "devType": 1,
    "lastReportWatts": 18,
    "maxReportWatts": 18
  },
  {
    "serialNumber": "121718037534",
    "lastReportDate": 1555635154,
    "devType": 1,
    "lastReportWatts": 108,
    "maxReportWatts": 187
  },
  {
    "serialNumber": "121718037683",
    "lastReportDate": 1555635148,
    "devType": 1,
    "lastReportWatts": 117,
    "maxReportWatts": 197
  },

我尝试在代码中添加以下内容:
# NOTE(review): fragment as pasted -- the loop below is indented although
# nothing shown here encloses it.  If `fnmatch` is the standard
# fnmatch.fnmatch, it takes (name, pattern); only the pattern is passed here,
# so no serial number is actually being tested.
ignore_list = ['121718037628']
       for pattern in ignore_list:
           if fnmatch( pattern):
                should_ignore = True

并尝试

# NOTE(review): the filtered list is built but not assigned to any name, so
# the result is discarded.
[f for f in serial if not any(a in f.split() for a in faultyunit)]

这是原始的python代码

#!/usr/bin/env python -f

import os
import time
import json
import requests
import threading
from requests.auth import HTTPDigestAuth
from prometheus_client import start_http_server, Gauge


# Connection settings: the Envoy host name and the installer password come
# from the environment (each is None when its variable is unset).
host = os.environ.get('ENVOY_HOST')
password = os.environ.get('ENVOY_PASS')

# Digest-auth credentials passed to the authenticated requests in this file.
user = 'installer'
auth = HTTPDigestAuth(username=user, password=password)
# Prefix that identifies payload lines in the /stream/meter response.
marker = b'data: '


# Maps each known inverter serial number to the value exported as its
# "location" label; an empty string means no location is assigned.
# Groups are listed in the original insertion order.
serials = {
    serial: location
    for location, group in (
        ('#1', (121718037663, 121718037534, 121718037513,
                121718037414, 121718037683)),
        ('', (121718037593,)),
        ('#1', (121718037695, 121718037872, 121718037601)),
        ('#2', (121718037876, 121718037698, 121718037881,
                121718037584, 121718037703)),
    )
    for serial in group
}


# Gauges for the per-phase meter readings, keyed by the field name looked up
# in the /stream/meter payload.  Every gauge carries the labels "type" and
# "phase".
stream_gauges = {
    field: Gauge(metric, description, ['type', 'phase'])
    for field, metric, description in (
        ('p', 'meter_active_power_watts', 'Active Power'),
        ('q', 'meter_reactive_power_watts', 'Reactive Power'),
        ('s', 'meter_apparent_power_watts', 'Apparent Power'),
        ('v', 'meter_voltage_volts', 'Voltage'),
        ('i', 'meter_current_amps', 'Current'),
        ('f', 'meter_frequency_hertz', 'Frequency'),
        ('pf', 'meter_power_factor_ratio', 'Power Factor'),
    )
}

# Gauges for the "production" entries of /production.json, keyed by the JSON
# field each one mirrors.  Every gauge carries a single "type" label.
production_gauges = {
    'activeCount': Gauge('production_active_count', 'Active Count', ['type']),
    # The help text used to read 'Active Count', copied from the entry above.
    # Only the description changes; the metric name stays as it was so that
    # existing queries and dashboards keep working.
    'wNow': Gauge('power_now_watts', 'Current production power', ['type']),
    'whToday': Gauge('production_today_watthours', 'Total production today', ['type']),
    'whLastSevenDays': Gauge('production_7days_watthours', 'Total production last seven days', ['type']),
    'whLifetime': Gauge('production_lifetime_watthours', 'Total production lifetime', ['type']),
}

# Gauges for the "consumption" entries of /production.json, keyed by the JSON
# field each one mirrors.  Every gauge carries a single "type" label.
consumption_gauges = {
    # The help text used to read 'Active Count', which does not describe a
    # power reading.  Only the description changes; the metric name is kept.
    'wNow': Gauge('consumption_now_watts', 'Current consumption power', ['type']),
    'whToday': Gauge('consumption_today_watthours', 'Total consumption today', ['type']),
    'whLastSevenDays': Gauge('consumption_7days_watthours', 'Total consumption last seven days', ['type']),
    'whLifetime': Gauge('consumption_lifetime_watthours', 'Total consumption lifetime', ['type']),
}

# Per-inverter gauges: 'last' holds the last reported watts and 'max' the
# maximum reported watts.  Both are labelled by serial number and location.
inverter_gauges = dict(
    last=Gauge(
        'inverter_last_report_watts',
        'Last reported watts',
        labelnames=['serial', 'location'],
    ),
    max=Gauge(
        'inverter_max_report_watts',
        'Max reported watts',
        labelnames=['serial', 'location'],
    ),
)


def scrape_stream():
    """Follow the Envoy meter stream forever and mirror it into the gauges.

    Every line of ``/stream/meter`` that starts with ``marker`` carries a JSON
    document.  For each meter type and phase found in it, every reading whose
    key has an entry in ``stream_gauges`` is stored under the matching
    ``type``/``phase`` labels.

    Request errors are printed and the connection is retried after five
    seconds.  A line that is not valid JSON is reported and skipped.  The
    function never returns, so it is meant to run in its own thread.
    """
    url = 'http://%s/stream/meter' % host
    while True:
        try:
            stream = requests.get(url, auth=auth, stream=True, timeout=5)
            try:
                for line in stream.iter_lines():
                    if not line.startswith(marker):
                        continue
                    # Strip only the leading marker; replace() would also
                    # remove any later occurrence inside the payload.
                    payload = line[len(marker):]
                    try:
                        data = json.loads(payload)
                    except ValueError as e:
                        # One malformed line must not end the whole thread.
                        print('Exception decoding stream data: %s' % e)
                        continue
                    print(data)
                    for meter_type in ['production', 'net-consumption', 'total-consumption']:
                        for phase in ['ph-a', 'ph-b']:
                            readings = data.get(meter_type, {}).get(phase, {})
                            for key, value in readings.items():
                                if key in stream_gauges:
                                    stream_gauges[key].labels(type=meter_type, phase=phase).set(value)
            finally:
                # Release the connection before reconnecting.
                stream.close()
        except requests.exceptions.RequestException as e:
            print('Exception fetching stream data: %s' % e)
            time.sleep(5)


def scrape_production_json():
    """Fetch ``/production.json`` once and update the production and
    consumption gauges.

    Each entry of the ``production`` list is labelled by its ``type`` field,
    and each entry of the ``consumption`` list by its ``measurementType``
    field.  Fields that are absent (or null) in an entry are left untouched.

    Raises:
        requests.exceptions.RequestException: if the request fails or does
            not answer within the timeout.
        KeyError: if the document lacks ``production``/``consumption`` or an
            entry lacks its type field.
    """
    url = 'http://%s/production.json' % host
    # A timeout keeps an unresponsive Envoy from blocking the caller forever;
    # five seconds matches the value used for the meter stream.
    data = requests.get(url, timeout=5).json()

    production = data['production']
    print(production)
    for each in production:
        mtype = each['type']
        for key in ['activeCount', 'wNow', 'whLifetime', 'whToday', 'whLastSevenDays']:
            value = each.get(key)
            if value is not None:
                production_gauges[key].labels(type=mtype).set(value)

    consumption = data['consumption']
    print(consumption)
    for each in consumption:
        mtype = each['measurementType']
        for key in ['wNow', 'whLifetime', 'whToday', 'whLastSevenDays']:
            value = each.get(key)
            if value is not None:
                consumption_gauges[key].labels(type=mtype).set(value)



def scrape_inverters(ignore_serials=(), max_age_seconds=None):
    """Fetch the per-inverter report once and update ``inverter_gauges``.

    Args:
        ignore_serials: Serial numbers to leave out.  Items may be strings or
            integers; they are compared as strings, which is how the API
            reports ``serialNumber``.  Defaults to excluding nothing.
        max_age_seconds: When given, inverters whose ``lastReportDate`` is
            older than this many seconds are left out.  This assumes
            ``lastReportDate`` is a Unix timestamp in seconds, as the sample
            values suggest -- TODO confirm.  ``None`` (the default) disables
            the check.

    Raises:
        requests.exceptions.RequestException: if the request fails or does
            not answer within the timeout.

    Note:
        Skipping an inverter only stops further updates; values that were
        already exported for it are not removed here.
    """
    url = 'http://%s/api/v1/production/inverters' % host
    # A timeout keeps an unresponsive Envoy from blocking the caller forever.
    data = requests.get(url, auth=auth, timeout=5).json()
    print(data)

    # Normalise to strings so '121718037628' and 121718037628 both match.
    ignored = {str(item) for item in ignore_serials}
    oldest_allowed = None
    if max_age_seconds is not None:
        oldest_allowed = time.time() - max_age_seconds

    for inverter in data:
        if str(inverter['serialNumber']) in ignored:
            continue
        if oldest_allowed is not None and inverter['lastReportDate'] < oldest_allowed:
            continue
        serial = int(inverter['serialNumber'])
        location = serials.get(serial, '')
        inverter_gauges['last'].labels(serial=serial, location=location).set(inverter['lastReportWatts'])
        inverter_gauges['max'].labels(serial=serial, location=location).set(inverter['maxReportWatts'])


def main():
    """Serve the metrics on port 8000 and keep them refreshed forever.

    The meter stream is followed in a background daemon thread, so it does
    not keep the process alive on its own.  The production and inverter
    endpoints are polled from this thread once every 60 seconds; any error
    raised by a poll is printed and the loop carries on.
    """
    start_http_server(8000)
    # Pass daemon=True to the constructor: Thread.setDaemon() is deprecated.
    stream_thread = threading.Thread(target=scrape_stream, daemon=True)
    stream_thread.start()
    while True:
        try:
            scrape_production_json()
            scrape_inverters()
        except Exception as e:
            print('Exception fetching scrape data: %s' % e)
        time.sleep(60)


# Start the exporter only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == '__main__':
    main()

并且我尝试添加此

}

# NOTE(review): the API sample shows "serialNumber" as a string, while this
# set holds an integer, so the membership test below compares str with int.
ignorelist = {
    121718037628,
}

for inverter in data:
     if inverter['serialNumber'] in ignorelist:
        continue
         # NOTE(review): this line is indented deeper than the `continue`
         # above it, which does not form a valid block as pasted.
         serial = int(inverter['serialNumber'])

但是它会跳过所有逆变器

也尝试过这种方法

# Placeholder for the API response: a list holding one empty record.
json_response = [{}]

但不确定如何从API读取内容

# Serial numbers (as strings) whose records should not be printed.
ignore_set = {'121718037628'}

for inverter in json_response:
    if inverter['serialNumber'] in ignore_set:
        continue  # excluded unit
    print(inverter)

最终解决了它,谢谢您的帮助

# Serial numbers to skip, kept as strings because the API reports
# "serialNumber" as a string.
ignorelist = {
    '121718037628', '121718037534',
}

for inverter in data:
    # The `if` must sit inside the loop body; as pasted it was at the same
    # level as `for`, which does not parse.
    if inverter['serialNumber'] not in ignorelist:
        print(inverter)
        serial = int(inverter['serialNumber'])
        location = serials.get(serial, '')

2 个答案:

答案 0 :(得分:1)

# Serial numbers to leave out, written as strings to match the API's
# "serialNumber" values.
ignorelist = {'121718037628', '121718037534'}

for inverter in data:
    if inverter['serialNumber'] in ignorelist:
        continue  # excluded unit: nothing further to do
    print(inverter)
    serial = int(inverter['serialNumber'])
    location = serials.get(serial, '')

答案 1 :(得分:0)

可以先检查序列号是否在忽略列表中,如果在,就跳过对该设备的后续处理:

for inverter in data:
    # Skip units on the ignore list; only the rest are processed.
    if inverter['serialNumber'] in ignorelist:
        continue
    serial = int(inverter['serialNumber'])