Files
clients/WebBasedCrawler/insta/instaheaders.py

107 lines
5.6 KiB
Python

def get_headers_for_list_html():
    """Return the fixed, browser-like request headers for the list HTML request.

    Returns:
        dict: A newly built dict on every call holding the ``accept``,
        ``accept-encoding``, ``accept-language`` and ``user-agent`` headers.
    """
    browser_identity = (
        "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko)"
        " Chrome/50.0.2661.102 Safari/537.36"
    )
    list_headers = {}
    list_headers["accept"] = "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8"
    list_headers["accept-encoding"] = "gzip, deflate, sdch, br"
    list_headers["accept-language"] = "ko-KR,ko;q=0.8,en-US;q=0.6,en;q=0.4"
    list_headers["user-agent"] = browser_identity
    return list_headers
def get_headers_for_body_html(cookies):
    """Return browser-like request headers for the body HTML request.

    Args:
        cookies: Mapping of cookie name to string value (must support
            ``.get`` and item lookup), or any falsy value such as ``None``
            or an empty mapping when no cookies are available.

    Returns:
        dict: A newly built header dict. When *cookies* is truthy a
        ``cookie`` header is appended, made of whichever of ``mid``,
        ``sessionid``, ``csrftoken`` and ``ds_user_id`` have a truthy value
        (in that order), followed by the fixed
        ``ig_pr=1; ig_vw=1920; s_network=`` suffix.
    """
    # Built once so the cookie and no-cookie variants cannot drift apart.
    request_headers = {
        "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
        "accept-encoding": "gzip, deflate, sdch, br",
        "accept-language": "ko-KR,ko;q=0.8,en-US;q=0.6,en;q=0.4",
        "user-agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko)"
                      " Chrome/50.0.2661.102 Safari/537.36",
        "upgrade-insecure-requests": "1",
        "cache-control": "max-age=0",
    }
    if cookies:
        # Missing or empty cookies are skipped rather than sent as "name=".
        cookie_parts = [
            name + '=' + cookies[name]
            for name in ('mid', 'sessionid', 'csrftoken', 'ds_user_id')
            if cookies.get(name, None)
        ]
        cookie_parts.append('ig_pr=1; ig_vw=1920; s_network=')
        request_headers['cookie'] = '; '.join(cookie_parts)
    return request_headers
def get_headers_for_ajax(cookies, referer, form_data):
    """Return the request headers for an AJAX form POST.

    Args:
        cookies: Mapping of cookie name to string value (must support
            ``.get`` and item lookup). ``csrftoken`` is required because it
            is also sent as the ``x-csrftoken`` header.
        referer: Value for the ``referer`` header.
        form_data: The form body that will be sent (text or bytes); only its
            size is used, for the ``content-length`` header.

    Returns:
        dict: A newly built header dict whose values are all strings
        (given string cookie values and *referer*).

    Raises:
        KeyError: If *cookies* has no ``csrftoken`` entry.
    """
    # Missing or empty cookies are skipped rather than sent as "name=".
    cookie_parts = [
        name + '=' + cookies[name]
        for name in ('mid', 'sessionid', 'csrftoken', 'ds_user_id')
        if cookies.get(name, None)
    ]
    cookie_parts.append('ig_pr=1; ig_vw=1920; s_network=')
    csrf_token = cookies['csrftoken']

    # Content-Length counts bytes, not characters, so a text body is measured
    # after encoding. NOTE(review): assumes the body is sent as UTF-8.
    if isinstance(form_data, bytes) or not hasattr(form_data, 'encode'):
        body_length = len(form_data)
    else:
        body_length = len(form_data.encode('utf-8'))

    return {
        'accept': 'application/json, text/javascript, */*; q=0.01',
        'accept-encoding': 'gzip, deflate, br',
        'accept-language': 'ko-KR,ko;q=0.8,en-US;q=0.6,en;q=0.4',
        'content-type': 'application/x-www-form-urlencoded; charset=UTF-8',
        'origin': 'https://www.instagram.com',
        'user-agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) '
                      'Chrome/50.0.2661.102 Safari/537.36',
        'cookie': '; '.join(cookie_parts),
        'x-csrftoken': csrf_token,
        # Header values must be strings; an int here is rejected by HTTP
        # clients that validate header types.
        'x-instagram-ajax': '1',
        'x-requested-with': 'XMLHttpRequest',
        'referer': referer,
        'content-length': str(body_length),
        'connection': 'keep-alive',
    }
def get_form_data_for_list_user(user_id, end_cursor, count):
    """Build the pre-encoded ``q=ig_user(...)`` form body for a user's media list.

    Args:
        user_id: Placed inside ``ig_user(...)`` after ``str()`` conversion.
        end_cursor: First argument of ``media.after(...)``, via ``str()``.
        count: Second argument of ``media.after(...)``, via ``str()``.

    Returns:
        str: The form body. The arguments are inserted verbatim; no
        percent-encoding is applied to them here.
    """
    # Fixed, already percent-encoded field selection that follows the arguments.
    selection = (
        ')+%7B%0A++count%2C%0A++nodes+%7B%0A++++caption%2C%0A++++code%2C%0A++++comments+%7B%0A++++++'
        'count%0A++++%7D%2C%0A++++date%2C%0A++++dimensions+%7B%0A++++++height%2C%0A++++++width%0A++++'
        '%7D%2C%0A++++display_src%2C%0A++++id%2C%0A++++is_video%2C%0A++++likes+%7B%0A++++++count%0A++++'
        '%7D%2C%0A++++owner+%7B%0A++++++id%0A++++%7D%2C%0A++++thumbnail_src%2C%0A++++video_views%0A++%7D%2C%0A++'
        'page_info%0A%7D%0A+%7D&ref=users%3A%3Ashow'
    )
    pieces = (
        'q=ig_user(',
        str(user_id),
        ')+%7B+media.after(',
        str(end_cursor),
        '%2C+',
        str(count),
        selection,
    )
    return ''.join(pieces)
def get_form_data_for_list_tag(hash_tag, end_cursor, count):
    """Build the pre-encoded ``q=ig_hashtag(...)`` form body for a tag's media list.

    Args:
        hash_tag: Placed inside ``ig_hashtag(...)`` after ``str()`` conversion.
        end_cursor: First argument of ``media.after(...)``, via ``str()``.
        count: Second argument of ``media.after(...)``, via ``str()``.

    Returns:
        str: The form body. The arguments are inserted verbatim; no
        percent-encoding is applied to them here, so the caller is
        responsible for any escaping *hash_tag* needs.
    """
    # Fixed, already percent-encoded field selection that follows the arguments.
    selection = (
        ')+%7B%0A++count%2C%0A++nodes+%7B%0A++++caption%2C%0A++++code%2C%0A++++comments+%7B%0A++++++count%0A++++'
        '%7D%2C%0A++++date%2C%0A++++dimensions+%7B%0A++++++height%2C%0A++++++width%0A++++%7D%2C%0A++++'
        'display_src%2C%0A++++id%2C%0A++++is_video%2C%0A++++likes+%7B%0A++++++count%0A++++%7D%2C%0A++++'
        'owner+%7B%0A++++++id%0A++++%7D%2C%0A++++thumbnail_src%2C%0A++++video_views%0A++%7D%2C%0A++'
        'page_info%0A%7D%0A+%7D&ref=tags%3A%3Ashow'
    )
    pieces = (
        'q=ig_hashtag(',
        str(hash_tag),
        ')+%7B+media.after(',
        str(end_cursor),
        '%2C+',
        str(count),
        selection,
    )
    return ''.join(pieces)
def get_form_data_for_reply(body_code, start_cursor, count):
    """Build the pre-encoded ``q=ig_shortcode(...)`` form body for a comments query.

    Args:
        body_code: Placed inside ``ig_shortcode(...)`` after ``str()`` conversion.
        start_cursor: First argument of ``comments.before(...)``, via ``str()``.
        count: Second argument of ``comments.before(...)``, via ``str()``.

    Returns:
        str: The form body. The arguments are inserted verbatim; no
        percent-encoding is applied to them here.
    """
    # Fixed, already percent-encoded field selection that follows the arguments.
    selection = (
        '%0A++++++++++)'
        '+%7B%0A++++count%2C%0A++++nodes+%7B%0A++++++id%2C%0A++++++'
        'created_at%2C%0A++++++text%2C%0A++++++user+%7B%0A++++++++id%2C%0A++++++++'
        'profile_pic_url%2C%0A++++++++username%0A++++++%7D%0A++++%7D%2C%0A++++'
        'page_info%0A++%7D%0A%7D%0A&ref=media%3A%3Ashow'
    )
    pieces = (
        'q=ig_shortcode(',
        str(body_code),
        ')+%7B%0A++comments.before'
        '(%0A++++++++++++',
        str(start_cursor),
        '%2C%0A++++++++++++',
        str(count),
        selection,
    )
    return ''.join(pieces)