获取AVA数据集

上传一个自己写的获取AVA数据集的代码

"""
Download the AVA action dataset.

2021/10/11:
Added:
    1. Reconnect after a disconnection (wait 5 seconds, then retry).
    2. Create the save directory if it does not exist.
"""
import os
import time

import requests
from contextlib import closing


# Text files listing the video file names to fetch (one list per entry).
txts = [
    'ava_file_names_trainval_v2.1.txt',
    'ava_file_names_test_v2.1.txt',
]
# Base URL that the file names from the matching list are appended to.
urls = [
    'https://s3.amazonaws.com/ava-dataset/trainval/',
    'https://s3.amazonaws.com/ava-dataset/test/',
]
# Local directory that the files from the matching list are saved into.
saves = [
    'AVA_Videos/train',
    'AVA_Videos/test',
]


def _wait_before_retry(seconds):
    """Print a one-line countdown of ``seconds`` seconds before a retry."""
    for elapsed in range(seconds):
        print('\r网络中断,{}s后尝试重新下载!'.format(seconds - elapsed), end='')
        time.sleep(1)
    print('\r开始尝试重新下载!', end='')


def _fetch_one(url, save_path, index, total, timeout):
    """Download ``url`` to ``save_path`` unless a complete copy already exists.

    ``index`` and ``total`` are only used for the progress display.
    Raises ``requests.exceptions.RequestException`` on network/HTTP failures
    and ``OSError`` on local file-system failures.
    """
    with closing(requests.get(url, stream=True, timeout=timeout)) as response:
        # Without this an error page (403/404) would be written to disk as if
        # it were the video, and later be treated as a finished download.
        response.raise_for_status()
        chunk_size = 1024  # bytes read per iteration (1KB)
        # Total body size; 0 means the server did not report it.
        content_size = int(response.headers.get('content-length', 0))
        data_count = 0  # bytes written so far
        if os.path.exists(save_path):
            local_size = os.path.getsize(save_path)
            print('{} 已存在,将比对文件大小 本地文件: {} - 远程文件: {}'.format(save_path, local_size, content_size))
            # Same size as the remote file: already downloaded, skip it.
            if content_size and local_size == content_size:
                print('{} 已经下载完成,下载下一个文件'.format(save_path))
                return
        with open(save_path, 'wb') as file:
            for data in response.iter_content(chunk_size=chunk_size):
                file.write(data)
                data_count = data_count + len(data)
                # Guard against division by zero when the size is unknown.
                now_jd = (data_count / content_size) * 100 if content_size else 0.0
                # Progress line, sizes shown in MB.
                print("\r {} / {} 文件下载进度:{:.2f}% ({:.2f}MB / {:.2f}MB) - {}".format(index, total, now_jd, data_count/1024/1024, content_size/1024/1024, save_path), end=" ")


def download(txts=txts, urls=urls, saves=saves, *, retry_wait=5, timeout=30):
    """Download every file named in ``txts`` from ``urls`` into ``saves``.

    The three sequences are parallel: ``txts[i]`` is a text file with one
    file name per line, ``urls[i]`` is the base URL those names are appended
    to, and ``saves[i]`` is the directory the files are written into (created,
    including parents, when missing).

    A file whose local size already equals the remote ``content-length`` is
    skipped. When a transfer fails because of a network problem (connection
    error, timeout, broken stream, or a 5xx response) the function waits
    ``retry_wait`` seconds and retries that same file. Other failures are
    not retried, because retrying cannot fix them.

    Args:
        txts: Paths of the text files listing the file names.
        urls: Base URLs, one per entry of ``txts``.
        saves: Target directories, one per entry of ``txts``.
        retry_wait: Seconds to wait before retrying after a network failure.
        timeout: Timeout in seconds passed to ``requests.get``.

    Raises:
        ValueError: If the three sequences differ in length.
        OSError: If a list file cannot be read or a target cannot be written.
        requests.exceptions.HTTPError: If the server answers with a 4xx status.
    """
    if not (len(txts) == len(urls) == len(saves)):
        raise ValueError('txts, urls and saves must have the same length')

    for txt, base_url, save_dir in zip(txts, urls, saves):
        with open(txt, 'r') as f:
            # Strip line endings (including '\r') and ignore blank lines so
            # they do not turn into requests for the bare directory URL.
            names = [name for name in (line.strip() for line in f) if name]
        # makedirs also creates missing parent directories; mkdir would not.
        os.makedirs(save_dir, exist_ok=True)
        total = len(names)
        for index, name in enumerate(names, start=1):
            # URLs always use '/', regardless of the local path separator.
            url = base_url.rstrip('/') + '/' + name
            save_path = os.path.join(save_dir, name)
            print('\n' + url)
            # Retry in a loop (not by recursion) so that long outages cannot
            # exhaust the call stack, and only the current file is retried.
            while True:
                try:
                    _fetch_one(url, save_path, index, total, timeout)
                    break
                except requests.exceptions.HTTPError as err:
                    status = err.response.status_code if err.response is not None else None
                    # 4xx means the request itself is wrong; retrying is futile.
                    if status is not None and status < 500:
                        raise
                    _wait_before_retry(retry_wait)
                except requests.exceptions.RequestException:
                    _wait_before_retry(retry_wait)

    print('全部下载完成!')


# Start the download using the module-level list files, base URLs and save directories.
download(txts, urls, saves)

ava_file_names_trainval_v2.1.txt

_-Z6wFjXtGQ.mkv
_145Aa_xkuE.mp4
_7oWZq_s_Sk.mkv
_a9SWtcaNj8.mkv
_Ca3gOdOHxU.mp4
_dBTTYDRdRQ.webm
_eBah6c5kyA.mkv
_ithRWANKB0.mp4
_mAfwH6i90E.mkv
-5KQ66BBWC4.mkv
-FaXLcSFjUI.mp4
-IELREHX_js.mp4
-OyDO1g74vc.mp4
-XpUuIgyUHE.mp4
-ZFgsrolSxo.mkv
053oq2xB3oU.mkv
0f39OWEqJ24.mp4
0wBYFahr3uI.mp4
1j20qq1JyX4.mp4
1ReZIMmD_8E.mp4
26V9UzqSguo.mp4
2bxKkUgcqpk.mp4
2DUITARAsWQ.mp4
2E_e8JlvTlg.mkv
2FIHxnZKg6A.webm
2fwni_Kjf2M.mkv
2KpThOF_QmE.mkv
2PpxiG0WU18.mkv
2qQs3Y9OJX0.mkv
3_VjIRdXVdM.mkv
32HR3MnDZ8g.mp4
3IOE-Q3UWdA.mp4
4gVsDd8PV9U.mp4
4k-rTF3oZKw.mp4
4Y5qi1gD2Sw.mkv
4ZpjKfu6Cl8.mkv
55Ihr6uVIDA.mkv
5BDj0ow5hnA.mp4
5LrOQEt_XVM.mp4
5milLu-6bWI.mp4
5MxjqHfkWFI.mkv
5YPjcdLbs5g.mkv
6d5u6FHvz7Q.mkv
7g37N3eoQ9s.mkv
7nHkh4sP5Ks.mkv
7T5G0CmwTPo.mkv
7YpF6DntOYw.mkv
8aMv-ZGD4ic.mkv
8JSxLhDMGtE.mkv
8nO5FFbIAog.webm
8VZEwOCQ8bc.mkv
914yZXz-iRs.mkv
9bK05eBt1GM.mp4
9eAOr_ttXp0.mkv
9F2voT6QWvQ.mkv
9HOMUW7QNFc.mkv
9IF8uTRrWAM.mkv
9mLYmkonWZQ.mkv
9QbzS8bZXFE.mkv
9Rcxr3IEX4E.mkv
9tyiDEYiWiA.mkv
9Y_l9NsnYE0.mp4
aDEYi1OG0vU.mkv
Ag-pXiLrd48.mp4
aMYcLyh9OhU.mkv
AN07xQokfiE.mp4
aRbLw-dU2XY.mp4
ax3q-RkVIt4.mp4
ayAMdYfJJLk.mkv
AYebXQ8eUkM.mkv
b-YoBU0XT90.mp4
B1MAUxpKaV8.mkv
b50s4AlOOKY.mkv
b5pRYl_djbs.mp4
bAVXp1oGjHA.mkv
BCiuXAuCKAU.mp4
bePts02nIY8.mkv
bhlFavrh7WU.mkv
bSZiZ4rOC7c.mkv
BXCh3r-pPAM.mkv
BY3sZmvUp-0.mp4
C25wkwAMB-w.mkv
C3qk4yAMANk.mkv
c9pEMjPT16M.webm
cc4y-yYm5Ao.mkv
CG98XdYsgrA.mkv
cKA-qeZuH_w.mkv
cLiJgvrDlWw.mp4
CMCPhm2L400.mkv
covMYDBa5dk.mp4
CrlfWnsS7ac.mkv
cWYJHb25EVs.mp4
CZ2NP8UsPuE.mkv
D-BJTU6NxZ8.mkv
D8Vhxbho1fY.mp4
Db19rWN5BGo.mkv
dgLApPvmfBE.mkv
Di1MG6auDYo.mkv
dMH8L7mqCNI.mkv
E2jecoyAx1M.mkv
E7JcKooKVsM.mp4
eA55_shhKko.mkv
Ecivp8t3MdY.mkv
Ekwy7wzLfjc.mkv
er7eeiJB6dI.mkv
F3dPH6Xqf5M.mp4
fD6VkIRlIRI.mkv
Feu1_8NazPE.mp4
fGgnNCbXZ20.mp4
fNcxxBjEOgw.mkv
fpprSy6AzKk.mkv
fZs-yXm-uUs.mp4
g1wyIcLPbq0.mp4
G4qq1MRXCiY.mkv
G5Yr20A5z_Q.mkv
GBXK_SyfisM.mkv
Gfdg_GcaNe8.mkv
gjasEUDkbuc.mkv
gjdgj04FzR0.mp4
GozLjpMNADg.mkv
gqmmpoO1JrY.mkv
Gt61_Yekkgc.mp4
Gvp-cj3bmIY.webm
hbYvDvJrpNk.mp4
hHgg9WI8dTk.mkv
Hi8QeP_VPu0.mkv
HJzgJ9ZjvJk.mkv
HKjR70GCRPE.mp4
Hscyg0vLKc8.mp4
HTYT2vF-j_w.mkv
HV0H6oc4Kvs.mkv
HVAmkvLrthQ.mkv
HymKCzQJbB8.mkv
I8j6Xq2B5ys.mp4
Ie35yEssHko.mkv
IKdBLciu_-A.mp4
iSlDMboCSao.mkv
IuPC-z-M9u8.mkv
IzvOYVMltkI.mp4
J1jDc2rTJlg.mkv
j35JnR0Q7Es.mp4
J4bt4y9ShTA.mkv
j5jmjhGBW44.mkv
jBs_XYHI7gM.mkv
jE0S8gYWftE.webm
jgAwJ0RqmYg.mp4
jI0HIlSsa3s.mkv
JNb4nWexD0I.mkv
jqZpiHlJUig.mkv
K_SpqDJnlps.mkv
kAsz-76DTDE.mkv
Kb1fduj-jdY.mp4
KHHgQ_Pe4cI.mkv
KIy2a-nejxg.mp4
kLDpP9QEVBs.mp4
kMy-6RtoOVU.mkv
kplbKz3_fZk.mkv
Ksd1JQFHYWA.mp4
KVq6If6ozMY.mkv
KWoSGtglCms.mkv
l-jxh8gpxuY.mkv
l2XO3tQk8lI.mkv
lDmLcWWBp1E.mkv
Lg1jOu8cUBM.mkv
LIavUJVrXaI.mkv
LrDT25hmApw.mkv
lT1zdTL-3SM.mkv
lWXhqIAvarw.mkv
M6cgEs9JgDo.mkv
Ma2hgTmveKQ.mkv
mfsbYdLx9wE.mkv
miB-wo2PfLI.mkv
mkcDANJjDcM.mkv
N0Dt9i9IUNg.mkv
N1K2bEZLL_A.mkv
N5UD8FGzDek.mkv
N7baJsMszJ0.mkv
NEQ7Wpf-EtI.mkv
nlinqZPgvVk.mkv
NO2esmws190.mkv
O_NYCUhZ9zw.mp4
o4xQ-BEa3Ss.mkv
O5m_0Yay4EU.mkv
oD_wxyTHJ2I.mp4
OfMdakd4bHI.mkv
OGNnUvJq9RI.mkv
oifTDWZvOhY.mkv
oITFHwzfw_k.mkv
om_83F5VwTQ.mp4
oq_bufAhyl8.mkv
Ov0za6Xb1LM.mkv
oWhvucAskhk.mkv
P60OxWahxBQ.mkv
P90hF2S1JzA.mkv
PcFEhUKhN6g.mkv
pGP_oIdKmRY.mkv
phrYEKv0rmw.mkv
phVLLTMzmKk.mkv
pieVIsGmLsc.mkv
piYxcrMxVPw.mkv
plkJ45_-pMk.mp4
PmElx9ZVByw.mp4
PNZQ2UJfyQE.mp4
QaIMUi-elFo.mkv
qBUu7cy-5Iw.mp4
QCLQYnt3aMo.webm
QD3L10bUnBo.mkv
QJzocCGLdHU.mp4
QMwT7DFA5O4.mkv
QotkBTEePI8.mkv
qpoWHELxL-4.mp4
qrkff49p4E4.mp4
qsTqtWVVSLM.mkv
QTmwhrVal1g.mkv
qx2vAO5ofmo.mp4
r2llOyS-BmE.mkv
rCb9-U4TArw.mp4
rFgb2ECMcrY.mkv
ri4P2enZT9o.mkv
Riu4ZKk4YdQ.webm
rJKeqfTlAeY.mkv
rk8Xm0EAOWs.mkv
Rm518TUhbRY.mkv
rUYsoIIE37A.mp4
rXFlJbXyZyc.mkv
S0tkhGJjwLA.mkv
sADELCyj10I.mkv
SCh-ZImnyyk.mp4
SHBMiL5f_3Q.mkv
skiZueh4lfY.mkv
sNQJfYvhcPk.mp4
sUVhd0YTKgw.mkv
T-Fc9ctuNVI.mkv
t0V4drbYDnc.mkv
t1LXrJOvPDg.mkv
T26G6_AjJZ4.mkv
TcB0IFBwk-k.mkv
TCmNvNLRWrc.mkv
tEoJW9ycmSY.mkv
TEQ9sAj-DPo.mp4
tghXjom3120.mkv
tjqCzVjojCo.mkv
TM5MPJIq1Is.mkv
tNpZtigMc4g.mkv
tt0t_a1EDCE.mkv
TzaVHtLXOzY.mkv
U_WzY2k8IBM.mkv
u1ltv6r14KQ.mkv
UgZFdrNT6W0.mkv
uNT6HrrnqPU.webm
UOfuzrwkclM.mkv
UOyyTUX5Vo4.mkv
uq_HBsvP548.mkv
UrsCy6qIGoo.mkv
UsLnxI_zGpY.mkv
uwW0ejeosmk.mkv
uzPI7FcF79U.mkv
v0L-WkMO3s4.mp4
vBbjA4tWCPg.mp4
vfjywN5CN0Y.mkv
Vmef_8MY46w.mkv
VRlpH1MbWUw.mp4
VsYPP2I0aUQ.mkv
wEAeql4z1O0.mp4
wfEOx36N4jA.mp4
WKqbLbU68wU.mkv
WlgxRNCHQzw.mkv
wogRuPNBUi8.mp4
wONG7Vh87B4.mkv
WSPvfxtqisg.mkv
WVde9pyaHg4.mkv
x-6CtPWVi6E.mkv
X5wWhZ2r9kc.mp4
xeGWXqSvC-8.webm
XF87VL5T0aA.mkv
XglAvHaEtHY.mp4
xJmRNZVDDCY.mkv
xmqSaQPzL1E.mkv
xO4ABy2iOQA.mp4
xp67EC-Hvwk.mkv
XpGRS72ghag.mkv
XV_FF3WC7kA.mkv
y7ncweROe9U.mkv
yMtGmGa8KZ0.mkv
yn9WN9lsHRE.mkv
yo-Kg2YxlZs.mkv
yqImJuC5UzI.mp4
Ytga8ciKWJc.mkv
yvgCGJ6vfkY.mkv
YYWdB7h1INo.mkv
z-fsLpGHq6o.mkv
Z1YV6wB037M.mkv
z3kgrh0L_80.mkv
zC5Fh2tTS1U.mp4
zG7mx8KiavA.mp4
zlVkeKC6Ha8.mp4
ZosVdkY76FU.mkv
zR725veL-DI.mkv
ZxQn8HVmXsY.mkv

ava_file_names_test_v2.1.txt

--205wugM18.mkv
-APF0-L14kw.mkv
-FLn0aeA6EU.mkv
0OLtK6SeTwo.mp4
1R7n8B8KkZE.mkv
1XZZnWMP4CU.mkv
2eTGj8zPykM.mkv
3-ivkPTSTSw.mp4
30Qkf0pq-PY.mkv
55R6Ng9w65o.mkv
6IebItD0ETQ.mkv
72MzYjWz_7g.mkv
7QstV153hbA.mkv
7SGCpWCNN84.mp4
7oY-kE-goOA.mkv
8FYx0LtfPTE.mkv
8oL0i5WorkE.mp4
9f8r96-it6c.mkv
A8SUe2Yqn60.mkv
A9WSiEDeu0I.mkv
AwlY-zteegM.mkv
BD3zaLKhkV4.mkv
BLDTynQwGRI.mkv
BU98nWUtT5E.mkv
BV1VreCWZ64.mkv
BnIFkfDhJ2w.mkv
DaUzhc9_6io.mp4
E-6ruyZFfZs.mkv
E-fqjlYMFhE.mp4
EHMP5-9KUdI.mp4
EO1gLAoEZRA.mp4
FONjBIXaM-0.mp4
G0gDuIVKiXg.mkv
GElolK2jG50.mkv
GQxKfbvL3mg.mkv
Gsm_ZBStr0s.mp4
HPd4eMvs1Kg.mp4
HeKz7BELAQc.mkv
HtXWX0LnifY.mp4
IC5M1EhJNfI.webm
IIyYHprTP58.webm
Ic0LMbDyc9Y.mkv
JiBiCiK9HjY.mp4
K-tICG1ek-E.mp4
Ke8b1_yiUVQ.mkv
KkAf75yOKqs.mkv
KrMSZUQJlNM.mkv
LO964EmiVfo.mkv
Mz0FKktvMLY.mkv
NUwem2aZa0Y.mp4
O5y8zKl9X2E.mp4
O8xkUcUJPNo.mkv
OEUMcSba9t0.mp4
OL_Wwo5W1Zs.mp4
OQxN4ksema0.mkv
P5EhajqkqPw.mkv
QTf_v67C5KI.mp4
Qes4a8HuyEc.mkv
RCNuAys0Hsg.mkv
RW-H3fN_79I.mp4
Scg5LeZszCc.mkv
Sntyb4omSfU.mkv
SoNhz0WJZsI.mkv
Uw7387tc9PU.mp4
V6RX59GT-3k.mkv
VNZ8JDb8sks.mkv
ViY7CR2TSO8.mkv
W8TFzEy0gp0.mkv
WMFTBgYWJS8.mkv
Wgytpy6TeUA.mp4
WhkON_S-pQc.mp4
XOe9GeojzCs.mp4
YAAUPjq-L-Q.mp4
Z0FEElATNjk.mkv
Z42lnoj2n08.mkv
ZS2C28fDC9U.mp4
ZbeMNLwASVo.mkv
ZsgPK0XGYoM.mp4
Zu4iQJrlpo0.mkv
_kbrVsCaaPo.mp4
_vy57h5Oeys.mkv
aDfOtlsdoWw.mkv
bNP8Q_8u89A.webm
bUVls-bf0jM.mkv
bzGQK5lH-RA.mkv
c5mlhcFYYZs.mp4
cYt6NaQgcEk.mp4
cqkChR44vkA.mkv
fT_WjgJ_-r0.mkv
gEI9qBdVt5I.mp4
h7Atb503JwY.webm
hgmK4Epb02E.mkv
i9cuy3teV0w.mkv
ipBRBABLSAk.mkv
jKKXDh4lYd0.mkv
kW5WyJ1QNpM.mkv
keUOiCcHtoQ.mkv
kvFlbTK812w.mkv
l8_Mk3-sZsQ.mkv
nAg_NVzLoAY.mkv
nRzhjXMIXt4.mkv
o-ZcbjLBtls.mkv
ohn_RxyaCy4.mp4
pSE4Dlork1Y.mp4
pSdPmmJ3-ng.mp4
rJibAAUEMDY.mkv
rRL0Ce8e-RY.mkv
rTCch_5JlkA.mp4
s2z5UASlrP8.mkv
sV3zZROy0uc.mkv
tDF-BqFfF78.mkv
tj-VmrMYtUI.mp4
u97DLHpcw7c.mkv
vL7N_xRJKJU.mp4
vsMgg4snZzM.mkv
w-jIrlwuv2Y.mkv
wamBSoyRtbs.mkv
woC9Vfbn74I.mkv
xH1WLtZ8csM.mp4
xJpDPrwLJh4.mkv
xT2ogY6xEsI.mp4
xYUx0drhUNk.mkv
xauSNGP5yA0.mkv
xdDTWBRWPLQ.mkv
y4lBI_gFnqI.mkv
y5o8w0FRj98.mkv
yQdi5Ke4dNY.mkv
yRRZkwtJCwU.mkv
z5lg_3abT-s.mkv
zm78XnWN7MU.mkv
zvxnOrzTg0M.mp4

运行时截图

在这里插入图片描述

评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值