[英]Extract data from python to excel
我有以下代码
from psaw import PushshiftAPI
import datetime
import pandas_datareader as web
import pandas as pd
api = PushshiftAPI()
start_time = int(datetime.datetime(2021,3,16).timestamp())
submissions = api.search_submissions(after=start_time,
subreddit='wallstreetbets',
filter=['url','author','title','subreddit'])
for submission in submissions:
#print(submission.created_utc)
#print(submission.title)
#print(submission.url)
words = submission.title.split()
cashtags = list(set(filter(lambda word: word.lower().startswith('$'), words)))
if len(cashtags) > 0:
print(cashtags)
print(submission.created_utc)
print(submission.title)
print(submission.url)
我想将数据导出到 excel 文件中,但我遇到了问题。 你们能帮忙吗? 我见过很多人使用“熊猫”,但我无法真正让它发挥作用。
我试过你的代码,但现金标签列表是空的,所以我写了try... except
这部分,以防这个问题恰好发生在我身上。 数据的 rest 应保存在 excel 文件中。 检查下面的代码:
from psaw import PushshiftAPI
import datetime
import openpyxl
import os
def save_submissions(submissions_file, submissions):
wb = openpyxl.reader.excel.load_workbook(submissions_file)
sheet = wb.active
num = 1
sheet["A"+str(num)] = "created_utc"
sheet["B"+str(num)] = "title"
sheet["C"+str(num)] = "url"
sheet["D"+str(num)] = "cashtags"
for submission in submissions:
num += 1
sheet["A"+str(num)] = submission.created_utc
sheet["B"+str(num)] = submission.title
sheet["C"+str(num)] = submission.url
try:
words = submission.title.split()
cashtags = list(set(filter(lambda word: word.lower().startswith('$'), words)))
sheet["D"+str(num)] = cashtags
except:
continue
wb.save(submissions_file)
api = PushshiftAPI()
start_time = int(datetime.datetime(2021,3,16).timestamp())
submissions = api.search_submissions(after=start_time,
subreddit='wallstreetbets',
filter=['url','author','title','subreddit'])
#create excell file
cwd = os.getcwd()
submissions_file = os.path.join(cwd, 'submissions.xlsx')
wb = openpyxl.Workbook()
wb.save(submissions_file)
save_submissions(submissions_file, submissions)
声明:本站的技术帖子网页,遵循CC BY-SA 4.0协议,如果您需要转载,请注明本站网址或者原文地址。任何问题请咨询:yoyou2525@163.com.