With a list of YouTube videoIDs in a text file, the code below aims to loop through these while getting the comment feeds from all these videos. Could anyone spot the looping error(s) I must have made, but cannot find?
# Set the videoID list
f = open('video_ids.txt', 'r')
videoID_list = f.read().splitlines()
f.close()
# Cycle through videoID list getting comments via the YouTube API
for video_id in videoID_list:
#Define the comments generator
def comments_generator(yt_service, video_id):
comment_feed = yt_service.GetYouTubeVideoCommentFeed(video_id=video_id)
while comment_feed is not None:
for comment in comment_feed.entry:
yield comment
next_link = comment_feed.GetNextLink()
if next_link is None:
comment_feed = None
else:
comment_feed = yt_service.GetYouTubeVideoCommentFeed(next_link.href)
for comment in comments_generator(yt_service, video_id):
# About the video
video_title = entry.media.title.text
video_date = entry.published.text
# About comments
author_name = comment.author[0].name.text
raw_text = comment.content.text
comment_date = comment.published.text
# Keep only alphanumeric characters and spaces in the comment text
text = re.sub(r'\W+', ' ', raw_text)
# Write to a file ('a' means append) - Comment text is set to lowercase [.lower()]
f = open('video_comments.tsv', 'a')
f.write("{}\t{}\t{}\t{}\t{}\t{}\t\r".format(video_title, video_date[:10], comment_date[:10], comment_date[11:19], author_name, text.lower()))
# Also print results on screen - Comment text is set to lowercase [.lower()]
print("{}\t{}\t{}\t{}\t{}\t{}\t\r".format(video_title, video_date[:10], comment_date[:10], comment_date[11:19], author_name, text.lower()))