# -*- coding: utf-8 -*-
"""Report comment statistics for the habrahabr.ru front page.

The script opens the front page, logs in with the configured account if
the page still advertises the login URL, then walks every "#comments"
link on the front page and prints:

* how many of those links carry no "<total> +<new>" counter,
* the largest total comment count seen,
* the title and URL of the post that owns that count (when non-zero).
"""
import re
import sys

# Site entry points and account credentials.
root_url = 'http://habrahabr.ru/'
login_url = 'http://habrahabr.ru/login/'
username = 'krig'
userpass = '******'  # placeholder value; set the real password before running

# URL pattern selecting the per-post "comments" links.
comments_re = r'habrahabr\.ru/blog.*/#comments'
# Link text of the form "<total> +<new>"; group 1 is compared as the count.
count_re = re.compile(r'(\d+)\s*\+(\d+)')
# Extracts the numeric post id from a comments-link URL.
post_id_re = re.compile(r'habrahabr\.ru/blog.*/(\d+)/#comments')


def is_logged_in(page_text):
    """Return True when *page_text* does not mention the login URL.

    The check is purely textual: a page that still contains ``login_url``
    is treated as belonging to an anonymous session.

    :param page_text: page body as text or as raw bytes (bytes are decoded
        as UTF-8 with replacement so the substring test cannot raise).
    :returns: ``False`` if ``login_url`` occurs in the page, else ``True``.
    """
    if isinstance(page_text, bytes):
        page_text = page_text.decode('utf-8', 'replace')
    return login_url not in page_text


def summarize_comment_links(comment_links):
    """Scan comments links and find the post with the most comments.

    :param comment_links: iterable of objects exposing ``text`` and
        ``absolute_url`` attributes (e.g. what ``Browser.links()`` yields).
    :returns: tuple ``(zero_comments, max_comments, top_post_id)`` where
        ``zero_comments`` counts links whose text has no "<total> +<new>"
        counter, ``max_comments`` is the largest total seen (0 if none) and
        ``top_post_id`` is the id string of the first post reaching that
        total, or ``None`` when no id could be extracted.
    """
    zero_comments = 0
    max_comments = 0
    top_post_id = None
    for link in comment_links:
        counter = count_re.search(link.text or '')
        if not counter:
            # No counter in the link text: counted as a post without comments.
            zero_comments += 1
            continue
        total = int(counter.group(1))
        if total <= max_comments:
            # Strict comparison: the first post with the top count wins ties.
            continue
        max_comments = total
        # comments_re is looser than post_id_re, so the id may be absent.
        id_match = post_id_re.search(link.absolute_url)
        top_post_id = id_match.group(1) if id_match else None
    return zero_comments, max_comments, top_post_id


def main():
    """Log in if necessary, scan the front page and print the statistics.

    Exits with status 1 when the page returned after submitting the login
    form still contains the login URL.
    """
    # Imported here so the helpers above stay importable without mechanize.
    from mechanize import Browser

    br = Browser()
    home_page = br.open(root_url)
    # NOTE(review): status messages are English replacements; the wording
    # of the original messages is not available - adjust as needed.
    print('Page title: %s' % br.title())

    if not is_logged_in(home_page.read()):
        print('Not logged in, signing in...')
        # Go straight to the login page instead of searching for the login
        # link by its text. Assumes login_url serves the form named "login".
        br.open(login_url)
        br.select_form(name='login')
        br['login'] = username
        br['password'] = userpass
        result_page = br.submit()
        if not is_logged_in(result_page.read()):
            print('Login failed')
            sys.exit(1)
    print('Logged in as %s' % username)

    print('Scanning front page...')
    br.open(root_url)
    zero_comments, max_comments, top_post_id = summarize_comment_links(
        br.links(url_regex=comments_re))

    # Resolve the winning post's own link once, after the scan, rather than
    # re-querying the page links every time a new maximum is found.
    title = url = ''
    if top_post_id is not None:
        post_link_re = r'habrahabr\.ru/blog.*/' + top_post_id + r'/?$'
        for post_link in br.links(url_regex=post_link_re):
            title = post_link.text
            url = post_link.absolute_url
            break

    print('Posts without comments: %s' % zero_comments)
    print('Most comments on a post: %s' % max_comments)
    if max_comments:
        print('Title: %s' % title)
        print('URL: %s' % url)


if __name__ == '__main__':
    main()
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*- import re from mechanize import Browser # , root_url = 'http://habrahabr.ru/' login_url = 'http://habrahabr.ru/login/' username = 'krig' userpass = '******' comments_re = r 'habrahabr\.ru/blog.*/#comments' count_re = re . compile ( '(\d+)\s*\+(\d+)' ) post_id_re = re . compile ( 'habrahabr\.ru/blog.*/(\d+)/#comments' ) def is_logged_in (page_text): return not login_url in page_text br = Browser() home_page = br. open (root_url) print ' ' , br.title() # , if not is_logged_in (home_page.read()): print " " br.follow_link(text= '' ) br.select_form(name= "login" ) br[ "login" ] = username br[ "password" ] = userpass result_page = br.submit() if not is_logged_in (result_page.read()): print " " exit( 1 ) else : print " " , username # max = zero_comments = 0 title = url = '' print " " br. open (root_url) # , # , , br.links(...) # for comments_url in [url for url in br.links(url_regex=comments_re)]: m = count_re.search(comments_url.text) # , if not m: zero_comments += 1 else : if int (m.group( 1 )) > max: max = int (m.group( 1 )) habrapost_id = post_id_re.search(comments_url.absolute_url).group( 1 ) post_url = [url for url in br.links(url_regex=r 'habrahabr\.ru/blog.*/' + habrapost_id + '/?$' )][0] title = post_url.text url = post_url.absolute_url print ' :' , zero_comments print ' :' , max if max: print ' :' , title print ' :' , url
# -*- coding: utf-8 -*-
"""Log in to Habrahabr and report the most-commented post on its main page.

The script opens the site root, logs in with the credentials below when the
page still links to the login form, then scans every "#comments" link on the
main page.  It prints how many of those links carry no "<total> +<new>"
counter, the largest total seen, and the title and URL of the post that
owns it.

The code is written so that it runs unchanged on Python 2 and Python 3
(single-argument ``print(...)`` calls, no version-specific syntax).
"""
import re
import sys

# Site entry points and account credentials.
root_url = 'http://habrahabr.ru/'
login_url = 'http://habrahabr.ru/login/'
username = 'krig'
userpass = '******'

# URL pattern of the "comments" link attached to each post on the main page.
comments_re = r'habrahabr\.ru/blog.*/#comments'
# Link text of the form "<total> +<new>"; group 1 is the total comment count.
count_re = re.compile(r'(\d+)\s*\+(\d+)')
# Extracts the numeric post id from a comments URL.
post_id_re = re.compile(r'habrahabr\.ru/blog.*/(\d+)/#comments')


def is_logged_in(page_text):
    """Return True when *page_text* does not mention the login URL.

    The check is purely textual: a page that contains ``login_url`` is
    treated as one served to an anonymous visitor.

    page_text -- page body as text, or as bytes (what ``response.read()``
                 yields on Python 3); bytes are decoded as UTF-8 with
                 undecodable sequences replaced.
    """
    if isinstance(page_text, bytes):
        page_text = page_text.decode('utf-8', 'replace')
    return login_url not in page_text


def scan_comment_links(links):
    """Summarise the comment links found on a page.

    links -- iterable of objects exposing ``text`` and ``absolute_url``
             attributes (mechanize ``Link`` objects in practice).

    Returns a tuple ``(zero_comments, max_comments, top_post_id)``:
      zero_comments -- number of links whose text has no "<total> +<new>"
                       counter;
      max_comments  -- largest total found (0 when there is none);
      top_post_id   -- id (string) of the first post reaching that total,
                       or None when no counter was found.
    """
    zero_comments = 0
    max_comments = 0
    top_post_id = None
    for link in links:
        # ``text`` may be None for links without any textual content.
        found = count_re.search(link.text or '')
        if not found:
            zero_comments += 1
            continue
        total = int(found.group(1))
        if total <= max_comments:
            continue
        id_match = post_id_re.search(link.absolute_url)
        if id_match is None:
            # Without a post id the post cannot be located later, so this
            # link cannot become the reported maximum.
            continue
        max_comments = total
        top_post_id = id_match.group(1)
    return zero_comments, max_comments, top_post_id


def main():
    """Run the whole scenario: open the site, log in, scan and report."""
    # Imported here so the pure helpers above can be imported (and tested)
    # on a machine that does not have mechanize installed.
    from mechanize import Browser

    br = Browser()
    home_page = br.open(root_url)
    print('Welcome to %s' % br.title())

    if not is_logged_in(home_page.read()):
        print('Trying to login')
        # NOTE(review): the original followed the login link by its caption,
        # but that caption was lost from the source; opening login_url
        # directly is assumed to reach the same form -- confirm.
        br.open(login_url)
        br.select_form(name='login')
        br['login'] = username
        br['password'] = userpass
        result_page = br.submit()
        if not is_logged_in(result_page.read()):
            print('Login failed.')
            sys.exit(1)
        print('Successfully logged in as %s' % username)

    print('We are starting to search for articles on the main page.')
    br.open(root_url)

    # The links are materialised into a list before use, as the original
    # script did on purpose; presumably a second br.links() call must not
    # run while the first generator is still being consumed -- verify.
    comment_links = list(br.links(url_regex=comments_re))
    zero_comments, max_comments, top_post_id = scan_comment_links(
        comment_links)

    print('Habratopics without habracomments: %d' % zero_comments)
    print('Maximum number of habracomments: %d' % max_comments)
    if max_comments:
        # The post itself is linked with the same path minus "#comments".
        post_url_re = r'habrahabr\.ru/blog.*/' + top_post_id + '/?$'
        post_link = next(iter(br.links(url_regex=post_url_re)), None)
        if post_link is None:
            print('Most Commented Topic: (post link not found)')
        else:
            print('Most Commented Topic: %s' % post_link.text)
            print('And it is located at: %s' % post_link.absolute_url)


if __name__ == '__main__':
    main()
$ python habratest.py
Welcome to Habrahabr
Trying to login
Successfully logged in as krig
We are starting to search for articles on the main page.
Habratopics without habracomments: 0
Maximum number of habracomments: 72
Most Commented Topic: Free Computers
And it is located at: http://habrahabr.ru/blogs/startup_ideas/52540/
Source: https://habr.com/ru/post/52554/
All Articles