#!/bin/python3
# pip3 install requests
# coding=utf8
import os
import time
from urllib.parse import unquote
import requests
import pymysql
headers = {
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,'
'application/signed-exchange;v=b3',
'Accept-Encoding': 'gzip, deflate, br',
'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8',
'Cache-Control': 'no-cache',
'Connection': 'keep-alive',
'Host': 'officecdn-microsoft-com.akamaized.net',
'Pragma': 'no-cache',
'Sec-Fetch-Mode': 'navigate',
'Sec-Fetch-Site': 'none',
'Sec-Fetch-User': '?1',
'Upgrade-Insecure-Requests': '1',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) '
'Chrome/78.0.3904.108 Safari/537.36 '
}
# 获取http文件名
def get_file_name(url, headers):
filename = ''
if 'Content-Disposition' in headers and headers['Content-Disposition']:
disposition_split = headers['Content-Disposition'].split(';')
if len(disposition_split) > 1:
if disposition_split[1].strip().lower().startswith('filename='):
file_name = disposition_split[1].split('=')
if len(file_name) > 1:
filename = unquote(file_name[1])
if not filename and os.path.basename(url):
filename = os.path.basename(url).split("?")[0]
if not filename:
return time.time()
return filename
# 下载http文件
def downFile(path, url):
get_file = requests.get(url=url, headers=headers, stream=True, allow_redirects=False, timeout=10)
content_length = get_file.headers['Content-Length']
file_name = get_file_name(url, get_file.headers)
print("文件大小:", content_length, "文件名称:" + file_name)
r = requests.get(url) # 发送请求
# 保存
with open(path + file_name, 'wb') as f:
f.write(r.content)
f.close()
return file_name
# 链接操作数据库
def connectSQL(do_sql):
config = {
'host': '***',
'port': 3306,
'user': '***',
'password': '***',
'database': '***',
'charset': 'utf8mb4',
'cursorclass': pymysql.cursors.Cursor,
}
# 打开数据库连接
db = pymysql.connect(**config)
try:
# 使用cursor()方法创建一个游标对象cursor
cursor = db.cursor()
# 使用execute()方法执行SQL
cursor.execute(do_sql)
db.commit()
print('返回数据的行数或影响的行数: %s' % cursor.rowcount)
# 使用 fetchone() 方法获取单条数据.
result = cursor.fetchall()
return result
except BaseException as err:
print(err)
db.rollback() # 若出错了,则回滚
finally:
# 关闭数据库连接
db.close()
# 表单的post文件上传
def postUrl(file_path, file_name):
# 1.指定url
url = 'http://***-file-api/fileUpload'
# 发起POST请求之前,要处理POST请求携带的参数 流程:
# 一、将POST请求封装到字典
# 上传的文件参数
files = {
"file": (file_name, open(file_path, "rb"), "file")
}
data = {
"file": open(file_path, "rb"),
"projectName": "***-file-api",
"isFixed": ""
}
# 发送请求
response = requests.post(url=url, files=files, data=data)
# 打印结果
print(response.json().get('body').get('intranetUrl'))
return response.json().get('body').get('intranetUrl')
# json格式的post请求
def delFile(fileUrl):
# 指定url
url = 'http://***-file-api/deleteFile'
# 请求头
headers = {"content-type": "application/json"}
# payload 为传入的参数
payload = {
"fileUrl": fileUrl
}
# json形式,参数用json
res = requests.post(url, json=payload, headers=headers)
print(res.json())
if __name__ == '__main__':
path = "D:\\files\\tmp\\"
sql = "SELECT id,test_img_url FROM tmp "
result = connectSQL(sql)
for row in result: # 打印结果
id = row[0]
url = row[1]
file_name = downFile(path, url)
print('id=%s url=%s' % (id, url))
file_path = "D:\\files\\tmp\\" + file_name
new_url = postUrl(file_path, get_file_name(url, headers))
new_sql = "INSERT INTO new_online_img (old_id, test_img_url, new_url) VALUES ({0}, '{1}', '{2}')" \
.format(id, url, new_url)
new_result = connectSQL(new_sql)
print()
print()
print('==========================================')
print()
print()
# 批量删除
# sql = "SELECT new_url FROM new_online_img"
# result = connectSQL(sql)
# for row in result: # 打印结果
# url = row[0]
# print(url)
# delFile(url)