(?:(.*?)(?: ...)?

|\n.*?.*?(.*?)

)''' matches = re.finditer(pattern, string) num = 0 for match in matches: parsed[num] = {'url' : match.group(1), 'text' : match.group(2), 'summary' : match.group(3) or match.group(4)} num += 1 return parsed def search(query, cookie, page=0, full=False): """ main function, returns parsed results Args: query - search string cookie - facebook cookie page - search result page number (optional) """ offset = page * 10 full = 1 if False else 0 escaped = url_encode('https://google.com/search?q=%s&start=%i&filter=%i' % (url_encode(query), offset, full)) headers = { 'Host': 'developers.facebook.com', 'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64; rv:68.0) Gecko/20100101 Firefox/68.0', 'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8', 'Accept-Language': 'en-US,en;q=0.5', 'Accept-Encoding': 'deflate', 'Connection': 'keep-alive', 'Cookie': cookie, 'Upgrade-Insecure-Requests': '1', 'Cache-Control': 'max-age=0', 'TE': 'Trailers' } response = requests.get('https://developers.facebook.com/tools/debug/echo/?q=%s' % escaped, headers=headers) cleaned_response = decode_html(response.text) parsed = parse(cleaned_response) return parsed