Build a Stack Exchange Scraper

  • + 0 comments
    import re
    import sys
    # Patterns are compiled once at import time.  The title and time patterns
    # use the non-greedy ``.+?`` so that a match stops at the FIRST closing
    # delimiter; a greedy ``.+`` would run to the last ``</a>`` / ``<`` on the
    # line and merge several questions when the markup is not one-tag-per-line.
    QUESTION_ID_RE = re.compile(r'(?<=questions/)\d+(?=/)')
    QUESTION_TITLE_RE = re.compile(r'(?<=hyperlink">).+?(?=</a>)')
    RELATIVE_TIME_RE = re.compile(r'(?<=relativetime">).+?(?=<)')


    def extract_records(html: str) -> list:
        """Return one ``"id;title;time"`` string per question found in *html*.

        Three independent scans are made over the text:

        * the digits between ``questions/`` and the following ``/``,
        * the text between ``hyperlink">`` and the next ``</a>``,
        * the text between ``relativetime">`` and the next ``<``.

        The n-th hit of each scan is combined into the n-th record.  If the
        scans yield different numbers of hits, only complete records are
        returned (the surplus hits are dropped) instead of raising
        ``IndexError``.

        Args:
            html: Raw page markup to search.

        Returns:
            A list of semicolon-joined records, in document order; empty when
            nothing matches.
        """
        ids = QUESTION_ID_RE.findall(html)
        titles = QUESTION_TITLE_RE.findall(html)
        times = RELATIVE_TIME_RE.findall(html)
        # zip() stops at the shortest sequence, so a missing title or time
        # never produces an out-of-range index.
        return [";".join(fields) for fields in zip(ids, titles, times)]


    if __name__ == "__main__":
        # Script mode: markup arrives on stdin, one record is printed per line.
        for record in extract_records(sys.stdin.read()):
            print(record)