forked from kriti21/webscrapingbs4Py
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgate_exam_papersg4g.py
109 lines (109 loc) · 4.3 KB
/
gate_exam_papersg4g.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
"""Scrape GATE CS question papers from geeksforgeeks.org.

Follows the 'GATE CS' link on the GeeksforGeeks front page, collects the
links to the individual quiz pages (titled either 'GATE-CS...' or
'GATE CS 20xx'), and writes every question — label, text, numbered answer
options, and the explanation when one is present — into a local file named
'gateprep-<n>', one file per quiz page.
"""
import re

import requests
from bs4 import BeautifulSoup

BASE_URL = "http://www.geeksforgeeks.org/"


def _dump_question(handle, question_div):
    """Write one question (label, text, options, optional explanation) to handle."""
    label = question_div.find('div', {'class': 'mtq_question_label'})
    handle.write(label.text)
    handle.write("\n")
    body = question_div.find('div', {'class': 'mtq_question_text'})
    handle.write(body.text)
    handle.write("\n")
    # Answer options, numbered (1), (2), ... in page order.
    answers = question_div.find_all('div', {'class': 'mtq_answer_text'})
    for count, ans in enumerate(answers, start=1):
        handle.write("(" + str(count) + ")")
        handle.write(ans.text)
        handle.write("\n")
    handle.write("\n\n\n")
    # The explanation block is optional on the page; if either div is
    # missing, .text on None raises AttributeError — skip silently, as
    # the original deliberately did (best-effort extraction).
    try:
        expl_label = question_div.find('div', {'class': 'mtq_explanation-label'})
        handle.write(expl_label.text)
        handle.write("\n")
        expl_text = question_div.find('div', {'class': 'mtq_explanation-text'})
        handle.write(expl_text.text)
        handle.write("\n")
    except AttributeError:
        pass
    handle.write("\n\n\n")


def _scrape_quiz_page(page_url, filename):
    """Fetch one quiz page and save all of its questions to *filename*.

    Errors while extracting individual questions are reported and the page
    is abandoned (best-effort), matching the original script's behaviour.
    """
    page = requests.get(page_url)
    soup = BeautifulSoup(page.text, 'html.parser')
    container = soup.find('div', id="mtq_question_container-1")
    inner = container.find('div')
    questions = inner.find_all('div', {'class': 'mtq_question mtq_scroll_item-1'})
    with open(filename, 'w') as handle:
        try:
            for question in questions:
                _dump_question(handle, question)
        except Exception as e:
            print(e)


def main():
    """Crawl from the front page to every GATE CS quiz and save each one."""
    front = requests.get(BASE_URL)
    soup = BeautifulSoup(front.text, 'html.parser')
    hgroups = soup.find_all('hgroup')
    # The second <hgroup> holds the subject navigation links.
    for link in hgroups[1].find_all('a', href=True, text='GATE CS'):
        gate_page = requests.get(str(link['href']))
        gate_soup = BeautifulSoup(gate_page.text, 'html.parser')
        # Quiz links come in two title styles on the GATE CS page.
        list1 = gate_soup.find_all('a', href=True, text=re.compile(r'^GATE-CS'))
        list2 = gate_soup.find_all('a', href=True, text=re.compile(r'^GATE\sCS\s20..$'))
        # BUG FIX: the original second loop fetched `link1` — the URL left
        # over from the first loop — instead of the current link, so every
        # 'GATE CS 20xx' file contained the wrong page. Processing both
        # lists through one code path fixes that and removes ~45 duplicated
        # lines. The counter now advances per link even on failure, so a
        # bad page no longer makes the next one overwrite its file.
        file_index = 1
        for quiz_link in list1 + list2:
            _scrape_quiz_page(quiz_link['href'], 'gateprep-' + str(file_index))
            file_index += 1
    print("Successfully saved all the files :)")


if __name__ == "__main__":
    main()