【发布时间】:2017-01-19 11:06:48
【问题描述】:
我正在尝试使用 xlsxwriter 创建一个 Excel 文件,并以当前日期和时间作为文件名。背景是:我想把这段代码加到一个网络爬虫中,该爬虫设置为每天中午运行,并将抓取结果导出到 Excel。我希望文件名与抓取时间相对应。
我尝试使用 datetime 函数没有成功:
import xlsxwriter
import datetime
# Attempt 1: name the workbook after the current date and time.
# Create a workbook and add a worksheet.
# The concatenation below wraps the name in literal single-quote characters,
# so the string handed to Workbook() itself starts and ends with "'".
# The "%Y-%m-%d %H:%M" format also puts a space and a colon into the name.
# NOTE(review): the quotes and ':' are presumably why this fails on Windows,
# where those characters are not allowed in file names -- confirm on target OS.
todays_date = "'" + datetime.datetime.now().strftime("%Y-%m-%d %H:%M") + '.xlsx' + "'"
workbook = xlsxwriter.Workbook(todays_date)
worksheet = workbook.add_worksheet()
# Some data we want to write to the worksheet.
expenses = (
['Rent', 1000],
['Gas', 100],
['Food', 300],
['Gym', 50],
)
# Start from the first cell. Rows and columns are zero indexed.
row = 0
col = 0
# Iterate over the data and write it out row by row.
for item, cost in (expenses):
worksheet.write(row, col, item)
worksheet.write(row, col + 1, cost)
row += 1
# Write a total using a formula.
# After the loop, `row` is the index of the first row below the data.
worksheet.write(row, 0, 'Total')
# The range B1:B4 is hard-coded to the four expense rows above.
worksheet.write(row, 1, '=SUM(B1:B4)')
workbook.close()
有谁知道为什么这不起作用或其他替代方法?
@Sandeep Hukku - 编辑代码如下:
import xlsxwriter
import datetime
# Attempt 2: same script with the literal quote characters removed from the name.
# Create a workbook and add a worksheet.
# todays_date = "'" + datetime.datetime.now().strftime("%Y-%m-%d %H:%M") + '.xlsx' + "'"
# strftime() already returns a str, so the str() wrapper does not change the value.
# The name still contains the space and the colon from "%Y-%m-%d %H:%M".
# NOTE(review): ':' is presumably still rejected in file names on Windows -- confirm.
todays_date = str(datetime.datetime.now().strftime("%Y-%m-%d %H:%M") )+ '.xlsx'
workbook = xlsxwriter.Workbook(todays_date)
worksheet = workbook.add_worksheet()
# Some data we want to write to the worksheet.
expenses = (
['Rent', 1000],
['Gas', 100],
['Food', 300],
['Gym', 50],
)
# Start from the first cell. Rows and columns are zero indexed.
row = 0
col = 0
# Iterate over the data and write it out row by row.
for item, cost in (expenses):
worksheet.write(row, col, item)
worksheet.write(row, col + 1, cost)
row += 1
# Write a total using a formula.
# After the loop, `row` is the index of the first row below the data.
worksheet.write(row, 0, 'Total')
# The range B1:B4 is hard-coded to the four expense rows above.
worksheet.write(row, 1, '=SUM(B1:B4)')
workbook.close()
@Snehal Parmar - 第二次更新:
import urllib
import urllib.request
from bs4 import BeautifulSoup
import datetime
import xlsxwriter
# Web scraping
def make_soup(url):
    """Open *url* and parse the response with BeautifulSoup's "html.parser".

    Returns the resulting BeautifulSoup object.
    """
    return BeautifulSoup(urllib.request.urlopen(url), "html.parser")
# Fetch and parse the page once at module level; getNames(), getRooms() and
# getRents() below all read this global `soup`.
soup = make_soup('http://www.url.co.uk')
def getNames():
    """Print the text of every ``<td class="propname">`` nested in a table cell.

    Walks each ``<tr>`` of the module-level ``soup``, then each ``<td>`` in
    that row, and prints ``.text`` for every matching descendant. Nothing is
    returned.
    """
    for table_row in soup.findAll('tr'):
        for cell in table_row.findAll('td'):
            name_cells = cell.findAll('td', {"class": "propname"})
            for name_cell in name_cells:
                print(name_cell.text)
def getRooms():
    """Print the text of every ``<span class="beds">`` nested in a table cell.

    Walks each ``<tr>`` of the module-level ``soup``, then each ``<td>`` in
    that row, and prints ``.text`` for every matching descendant. Nothing is
    returned.
    """
    for table_row in soup.findAll('tr'):
        for cell in table_row.findAll('td'):
            bed_spans = cell.findAll('span', {"class": "beds"})
            for bed_span in bed_spans:
                print(bed_span.text)
def getRents():
    """Print the text of every ``<td class="rentprice">`` nested in a table cell.

    Walks each ``<tr>`` of the module-level ``soup``, then each ``<td>`` in
    that row, and prints ``.text`` for every matching descendant. Nothing is
    returned.
    """
    for table_row in soup.findAll('tr'):
        for cell in table_row.findAll('td'):
            rent_cells = cell.findAll('td', {"class": "rentprice"})
            for rent_cell in rent_cells:
                print(rent_cell.text)
''' To do: get the scraped data to an Excel doc.'''
# Create a workbook and add a worksheet.
# Build the file name from the current timestamp, then replace the space and
# the colon produced by "%Y-%m-%d %H:%M" with underscores.
todays_date = str(datetime.datetime.now().strftime("%Y-%m-%d %H:%M") )+ '.xlsx'
todays_date = todays_date.replace(" ", "_").replace(":", "_")
workbook = xlsxwriter.Workbook(todays_date)
worksheet = workbook.add_worksheet()
# Data to Excel.
# Each get*() call runs while this tuple is being built. As written in this
# file those functions only print and have no return statement, so the second
# element of every pair is None.
Excel_dump = (
['Name', getNames()],
['Rent', getRents()],
['Rooms', getRooms()]
)
# Start from the first cell. Rows and columns are zero indexed.
row = 0
col = 0
# Iterate over the data and write it out row by row.
# NOTE(review): the loop body looks unfinished -- the first write() call has no
# arguments, the second passes (col, row, ...) where the earlier snippets in
# this post pass (row, col, ...), the third passes no value, and `cost` is
# never used. Confirm the intended layout before relying on this loop.
for item, cost in Excel_dump:
worksheet.write()
worksheet.write(col, row, item)
worksheet.write(col, row + 1)
row += 1
# NOTE(review): no workbook.close() is visible in this snippet.
【问题讨论】:
标签: python datetime xlsxwriter