# Scraper for wholesale market prices published on nc.mofcom.gov.cn.
#
# For every province in `citys` the script asks the market-list endpoint for
# that province's markets, takes the first one, pages through its price
# records and stores every record that is not yet present in the XinXi table.
#
# NOTE(review): no imports are visible in this part of the file. The script
# expects `requests`, `time`, `parse` (presumably `urllib.parse`), `and_`
# (presumably `sqlalchemy.and_`) and the project's `models` module to be in
# scope already -- confirm against the real file header.

# Request headers captured from a browser session.
# A fixed `Content-Length` is deliberately not listed: the request bodies
# built below differ in length, so a single captured value cannot be right
# for all of them; the HTTP client derives the header from the actual body.
headers = {
    b'Accept': b'application/json, text/javascript, */*; q=0.01',
    b'Accept-Encoding': b'gzip, deflate',
    b'Accept-Language': b'zh-CN,zh;q=0.9,ja;q=0.8,ru;q=0.7',
    b'Cache-Control': b'no-cache',
    b'Connection': b'keep-alive',
    b'Content-Type': b'application/x-www-form-urlencoded; charset=UTF-8',
    b'Cookie': b'insert_cookie=27508778',
    b'Host': b'nc.mofcom.gov.cn',
    b'Origin': b'http://nc.mofcom.gov.cn',
    b'Pragma': b'no-cache',
    b'Referer': b'http://nc.mofcom.gov.cn/jghq/marketDetail?eudId=45233',
    b'User-Agent': b'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
    b'X-Requested-With': b'XMLHttpRequest',
}

# Province name -> code sent as the `province` form field of the list request.
citys = {
    '安徽': '340000', '北京': '110000', '福建': '350000', '甘肃': '620000',
    '广东': '440000', '广西': '450000', '贵州': '520000', '海南': '460000',
    '河北': '130000', '河南': '410000', '黑龙江': '230000', '湖北': '420000',
    '湖南': '430000', '吉林': '220000', '江苏': '320000', '江西': '360000',
    '辽宁': '210000', '内蒙古': '150000', '宁夏': '640000', '青海': '630000',
    '山东': '370000', '山西': '140000', '陕西': '610000', '上海': '310000',
    '四川': '510000', '天津': '120000', '西藏': '540000', '新疆': '650000',
    '云南': '530000', '浙江': '330000', '重庆': '500000',
}

MARKET_LIST_URL = 'http://nc.mofcom.gov.cn/jghq/marketList'
MARKET_DETAIL_URL = 'http://nc.mofcom.gov.cn/jghq/marketDetail'
# Form bodies are sent as pre-encoded strings; `{}` slots are filled per request.
MARKET_LIST_BODY = 'province={}&city=&isprod_mark=&par_craft_index=&pageNo=1'
MARKET_DETAIL_BODY = 'pageNo={}&craftName=&craftIndex=&eudName={}&queryDateType=0&timeRange=&sortColumns=%5B%7B%22column%22%3A%22GET_P_DATE%22%2C%22ordername%22%3A%22asc%22%7D%5D'
# Human-facing page of a market; stored with every record and used for de-duplication.
DETAIL_PAGE_URL = 'http://nc.mofcom.gov.cn/jghq/marketDetail?eudId={}'

MARKETS_PER_PROVINCE = 1   # only the first market of each province is scraped
FIRST_PAGE = 1
LAST_PAGE = 6              # price pages 1..6 are fetched for each market
REQUEST_TIMEOUT = 30       # seconds; without a timeout a stalled server blocks forever

for city, value in citys.items():
    list_response = requests.post(
        url=MARKET_LIST_URL,
        data=MARKET_LIST_BODY.format(value),
        headers=headers,
        timeout=REQUEST_TIMEOUT,
    )
    # Fail with a clear HTTP error instead of a JSON/KeyError further down.
    list_response.raise_for_status()
    market_list = list_response.json()  # decode once, reuse below
    print(market_list)

    for market in market_list['result'][:MARKETS_PER_PROVINCE]:
        market_name = market['EUD_NAME']
        print(market_name)
        market_id = market['ID']
        market_intro = market['CONTENT']

        # Both values are constant for the whole market, so build them once.
        detail_link = DETAIL_PAGE_URL.format(market_id)
        quoted_name = parse.quote(market_name)

        for page_no in range(FIRST_PAGE, LAST_PAGE + 1):
            detail_response = requests.post(
                url=MARKET_DETAIL_URL,
                data=MARKET_DETAIL_BODY.format(page_no, quoted_name),
                headers=headers,
                timeout=REQUEST_TIMEOUT,
            )
            detail_response.raise_for_status()
            price_page = detail_response.json()
            print(price_page)

            for record in price_page['result']:
                # GET_P_DATE is divided by 1000 before conversion, i.e. it is
                # handled as a millisecond epoch timestamp.
                # NOTE(review): the date is rendered in the machine's local
                # time zone -- confirm that matches the site's time zone.
                record_date = time.strftime(
                    '%Y-%m-%d',
                    time.localtime(record['GET_P_DATE'] // 1000),
                )
                product = record['CRAFT_NAME']

                # A record is identified by (date, market detail link, product).
                # `.first()` is enough for an existence check and avoids
                # loading every matching row.
                already_stored = models.XinXi.query.filter(and_(
                    models.XinXi.日期 == record_date,
                    models.XinXi.详情 == detail_link,
                    models.XinXi.产品 == product,
                )).first()
                if already_stored is not None:
                    continue

                models.db.session.add(
                    models.XinXi(
                        日期=record_date,
                        产品=product,
                        价格=record['AG_PRICE'],
                        市场=record['EUD_NAME'],
                        省份=city,
                        详情=detail_link,
                        介绍=market_intro,
                    )
                )
                # Committed per inserted row so the existence check above
                # always sees rows stored earlier in the same run.
                models.db.session.commit()
# Summary statistics (average, maximum, minimum) of the `price` column of a
# CSV file, computed with PySpark.
from pyspark.sql import SparkSession
# Imported as a namespace: importing `min` and `max` by name would shadow the
# Python builtins for the rest of the module.
from pyspark.sql import functions as F

# Create the SparkSession.
spark = SparkSession.builder \
    .appName("AgriPriceAnalysis") \
    .getOrCreate()

try:
    # Read the CSV file; the path is assumed to be 'agri_prices.csv'.
    df = spark.read.csv('agri_prices.csv', header=True, inferSchema=True)

    # Inspect the data structure.
    df.printSchema()

    # Show the first rows of the data.
    df.show()

    # Compute all three statistics in a single aggregation instead of
    # launching one Spark job per statistic.
    price_stats = df.agg(
        F.avg("price").alias("avg_price"),
        F.max("price").alias("max_price"),
        F.min("price").alias("min_price"),
    ).first()

    # Average price.
    avg_price = price_stats["avg_price"]
    print("Average Price:", avg_price)

    # Highest price.
    max_price = price_stats["max_price"]
    print("Maximum Price:", max_price)

    # Lowest price.
    min_price = price_stats["min_price"]
    print("Minimum Price:", min_price)
finally:
    # Stop the SparkSession even when reading or aggregating fails.
    spark.stop()
# 欢迎光临 ToB企服应用市场:ToB评测及商务社交产业平台 (https://dis.qidao123.com/) | Powered by Discuz! X3.4