video_util.py
1.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
import requests
import pandas as pd
# Prefix of the per-id lookup files on the data.yt8m.org storage bucket.
# getURL() appends "<id prefix>/<id>.js" to this to build the request URL.
base_URL = "https://storage.googleapis.com/data.yt8m.org/2/j/i/"

# Prefix of a YouTube watch link; the resolved video id is appended to it.
youtube_url = "https://www.youtube.com/watch?v="
def getURL(vid_id):
    """Resolve a dataset video id to a YouTube watch URL.

    Only the first four characters of ``vid_id`` are used. The lookup file
    is fetched from ``base_URL + <id without its last two chars> + '/' +
    <id> + '.js'``.

    Args:
        vid_id: Dataset video id; anything past the fourth character is
            ignored.

    Returns:
        ``youtube_url`` followed by the id extracted from the response, or
        an empty string when the lookup fails (non-200 status, or any
        network/TLS error raised by ``requests``).
    """
    vid_id = vid_id[0:4]
    URL = base_URL + vid_id[:-2] + '/' + vid_id + '.js'
    try:
        # Certificate verification is left at the library default (enabled),
        # and a timeout is set so a stalled connection cannot block forever.
        response = requests.get(URL, timeout=10)
    except requests.RequestException:
        # Treat transport failures the same way as a failed lookup.
        return ""
    if response.status_code != 200:
        return ""
    # NOTE(review): the slice assumes a payload shaped like
    # i("xxxx","<youtube id>"); -- 10 leading and 3 trailing characters are
    # dropped. Confirm against the service's actual response format.
    return youtube_url + response.text[10:-3]
if __name__ == "__main__":
    # Manual smoke test. Guarded so that importing this module does not
    # perform a network request or print anything.
    print(getURL('nzwW'))
def getVideoInfo(vid_id, video_tags_path, top_k, isPerVideo):
    """Collect the display URL and the top-k tag names for one entry.

    The CSV at ``video_tags_path`` is read on every call and filtered to
    the rows whose ``vid_id`` column equals ``vid_id``. The tag names come
    from columns ``segment1`` .. ``segment<top_k>`` of the first matching
    row; each cell is split on ``":"`` and only the part before it is kept.

    Debug output (the id, the matching rows and each column's values) is
    written to stdout.

    Args:
        vid_id: Entry id as stored in the CSV. Its first four characters
            are passed to ``getURL``. When ``isPerVideo`` is ``False`` the
            text from index 5 onward must parse as a float.
        video_tags_path: Path of the tags CSV (read as UTF-8).
        top_k: Number of ``segment<i>`` columns to read, starting at 1.
        isPerVideo: When equal to ``False``, a "similar point" line is
            appended to the URL text.

    Returns:
        A dict with ``"video_url"`` (str) and ``"video_tags"`` (list of
        tag names).

    Raises:
        KeyError: if a required ``segment<i>`` column is missing.
        IndexError: if no row matches ``vid_id`` and ``top_k`` >= 1.
    """
    print("vid_id = ", vid_id)
    link = getURL(vid_id[:4])

    tag_table = pd.read_csv(video_tags_path, encoding='utf8')
    matching_rows = tag_table.loc[tag_table["vid_id"] == vid_id]
    print(matching_rows)

    video_tags = []
    for rank in range(1, top_k + 1):
        column_values = matching_rows[f"segment{rank}"].values
        print("vals ", column_values)
        # ex: "mobile-phone:0.361"
        label_and_score = column_values[0]
        tag_name = label_and_score.split(":")[0]
        video_tags.append(tag_name)

    # No URL could be resolved: show the tag names instead, each one
    # preceded by a single space.
    if link == "":
        link = "".join(' ' + tag_name for tag_name in video_tags)

    # Kept as an explicit comparison with False; `not isPerVideo` would
    # behave differently for values such as None.
    if isPerVideo == False:
        # NOTE(review): presumably vid_id looks like "<4-char id>:<segment
        # index>" and each segment spans 5 time units -- confirm with caller.
        offset = float(vid_id[5:]) * 5
        link = link + '\nThe similar point is : ' + str(offset)

    info = {"video_url": link, "video_tags": video_tags}
    return info