bypass-all-shortlinks-deblo.../2_generate_includes.py

import re

def extract_regex_from_js(js_code):
    """Collect the site patterns referenced in the userscript source.

    Five call shapes are scanned and their captures concatenated in this
    order: ``BypassedByBloggerPemula(<first argument>,`` (with leading and
    trailing ``/`` stripped), ``BloggerPemula('...',``, ``RemoveBp('...',``,
    ``case '...':`` and ``h.href.includes('...')``.

    Args:
        js_code: Text of the userscript to scan.

    Returns:
        A list of the captured strings; duplicates are kept.
    """
    # The first argument of BypassedByBloggerPemula(...) is captured up to the
    # first comma; the surrounding slashes are removed from each capture.
    found = [
        literal.strip('/')
        for literal in re.findall(r'BypassedByBloggerPemula\((.*?),', js_code)
    ]

    # The remaining shapes all capture the text between single quotes.
    quoted_sources = (
        r"BloggerPemula\('([^']+)',",
        r"RemoveBp\('([^']+)',",
        r'case \'(.*?)\':',
        r"h\.href\.includes\('(.*?)'\)",
    )
    for source in quoted_sources:
        found.extend(re.findall(source, js_code))

    return found

def regex_to_include_line(regex):
    """Build the userscript header line for one site pattern.

    Patterns containing any of ``|``, ``(``, ``)`` or ``*`` are wrapped in a
    group and emitted as a regex ``// @include`` rule. Every other pattern is
    emitted as a ``// @match *://*.<pattern>/*`` rule.

    Args:
        regex: The site pattern, without surrounding slashes.

    Returns:
        The header line as a string (no trailing newline).
    """
    # Use @include for more complex regex
    if any(char in regex for char in '|()*'):
        grouped = '(' + regex + ')'
        # Raw strings keep the backslashes literally; the non-raw spellings
        # "\/" and "\." are invalid escape sequences that Python warns about.
        include_line = r"// @include /^(https?:\/\/)(.+)?" + grouped + r"(\/.*)/"
        # When the pattern already ends in "\.*" the trailing path group is
        # redundant, so it is dropped.
        return include_line.replace(r"\.*)(\/.*)/", r"\.*)/")

    # Use @match for simpler regex
    return '// @match *://*.' + regex + '/*'

def generate_include_lines(regex_list):
    include_lines = []
    for regex in regex_list:
        include_line = regex_to_include_line(regex)
        include_lines.append(include_line)

    return include_lines

def write_to_file(filename, lines):
    """Write ``lines`` to ``filename`` as UTF-8, one entry per line.

    The file is created or truncated, each entry is followed by a newline,
    and a confirmation message is printed once the file has been closed.

    Args:
        filename: Path of the file to write.
        lines: Iterable of strings to write.
    """
    with open(filename, 'w', encoding='utf-8') as out:
        out.writelines(entry + '\n' for entry in lines)
    print(f"OK: Generated {filename}")

def compile_and_print(regex_strings):
    """Write the supported-sites list and the derived header lines to disk.

    ``supported_sites.txt`` receives the patterns exactly as given.
    ``includes.txt`` receives the lines produced by
    ``generate_include_lines``. The number of generated lines is printed
    between the two writes.

    Args:
        regex_strings: List of site patterns.
    """
    write_to_file('supported_sites.txt', regex_strings)

    header_lines = generate_include_lines(regex_strings)
    line_count = len(header_lines)
    print(f"OK: Generated {line_count} include lines.")

    write_to_file('includes.txt', header_lines)


def main():
    """Read the untouched userscript and generate the site/include files.

    Patterns are extracted from ``untouched_Bypass_All_Shortlinks.user.js``,
    filtered, and passed to ``compile_and_print``. A missing input file and
    any other exception are reported on stdout instead of being raised.
    """
    file_path = 'untouched_Bypass_All_Shortlinks.user.js'

    # Patterns containing any of these words are left out of the output.
    blocked_words_for_includes = (
        "google",
        "youtube",  # youtube is for redirecting shorts, but I remove it to avoid people worrying
    )

    def is_wanted(candidate):
        # Drop short domains (errors): keep only entries with a dot and at
        # least five characters.
        if "." not in candidate or len(candidate) < 5:
            return False
        # Drop domains with blocked words.
        return not any(word in candidate for word in blocked_words_for_includes)

    try:
        with open(file_path, 'r', encoding='utf-8') as source:
            js_code = source.read()

            candidates = extract_regex_from_js(js_code)
            kept = [candidate for candidate in candidates if is_wanted(candidate)]

            compile_and_print(kept)
    except FileNotFoundError:
        print(f"Error: File '{file_path}' not found.")
    except Exception as e:
        print(f"An error occurred: {e}")

if __name__ == "__main__":
    main()
Upload files to "/" 2024-01-18 06:12:01 +05:00			`import re`

			`def extract_regex_from_js(js_code):`
			`pattern1 = r'BypassedByBloggerPemula\((.*?),'`
			`matches1 = re.findall(pattern1, js_code)`
			`matches1 = [match.strip('/') for match in matches1]`

			`pattern2 = r"BloggerPemula\('([^']+)',"`
			`matches2 = re.findall(pattern2, js_code)`
			`#matches2 = ['/' + s + '/' for s in matches2]`

			`pattern3 = r"RemoveBp\('([^']+)',"`
			`matches3 = re.findall(pattern3, js_code)`

			`pattern4 = r'case \'(.*?)\':'`
			`matches4 = re.findall(pattern4, js_code)`

			`pattern5 = r"h\.href\.includes\('(.*?)'\)"`
			`matches5 = re.findall(pattern5, js_code)`

			`return matches1+matches2+matches3+matches4+matches5`

			`def regex_to_include_line(regex):`
			`#regex = regex.strip("/")`
use match rules instead of include rules whenever possible 2024-01-19 22:13:39 +05:00
			`#Use @include for more complex regex`
use include instead of match for some other complex regex 2024-01-20 04:56:46 +05:00			`if any(char in regex for char in ['\|', '(', ')', '*']):`
use match rules instead of include rules whenever possible 2024-01-19 22:13:39 +05:00			`regex = '(' + regex + ')'`
			`include_line = "// @include /^(https?:\/\/)(.+)?" + regex + "(\/.*)/"`
			`include_line = include_line.replace( "\.)(\/.)/", "\.*)/" ) #clean excess in the regex`

			`#Use @match for simpler regex`
			`else:`
			`include_line = '// @match ://.' + regex + '/*'`
Upload files to "/" 2024-01-18 06:12:01 +05:00
			`return include_line`

			`def generate_include_lines(regex_list):`
			`include_lines = []`
			`for regex in regex_list:`
			`include_line = regex_to_include_line(regex)`
			`include_lines.append(include_line)`

			`return include_lines`

			`def write_to_file(filename, lines):`
removed non-english, added metadata removed non-english descriptions, added a metadata file, specified file encoding for writting and reading 2024-01-25 21:27:17 +05:00			`with open(filename, 'w', encoding='utf-8') as file:`
Upload files to "/" 2024-01-18 06:12:01 +05:00			`for line in lines:`
			`file.write(line + '\n')`
			`print(f"OK: Generated {filename}")`

			`def compile_and_print(regex_strings):`
			`#for regex_string in regex_strings: print(regex_string)`
remove google domain and make supported sites list visible 2024-01-19 18:32:10 +05:00			`write_to_file('supported_sites.txt', regex_strings)`
Upload files to "/" 2024-01-18 06:12:01 +05:00
			`include_lines = generate_include_lines(regex_strings)`
			`print(f"OK: Generated {len(include_lines)} include lines.")`

			`#for line in include_lines: print(line)`
			`write_to_file('includes.txt', include_lines)`

remove google domain and make supported sites list visible 2024-01-19 18:32:10 +05:00
Upload files to "/" 2024-01-18 06:12:01 +05:00			`def main():`
			`file_path = 'untouched_Bypass_All_Shortlinks.user.js'`

			`try:`
			`with open(file_path, 'r', encoding='utf-8') as file:`
			`js_code = file.read()`
add recaptcha and shrinkme.us to includes add recaptcha/api2 to match, so they are auto open when that option is enabled. Also added domain shrinkme.us which has one of those captchas 2024-01-21 00:45:53 +05:00
Upload files to "/" 2024-01-18 06:12:01 +05:00			`regex_strings = extract_regex_from_js(js_code)`
add recaptcha and shrinkme.us to includes add recaptcha/api2 to match, so they are auto open when that option is enabled. Also added domain shrinkme.us which has one of those captchas 2024-01-21 00:45:53 +05:00
simplify script code and remove the manually added domain which is not necessary 2024-01-21 15:02:58 +05:00			`# remove short domains (errors)`
remove google and recaptcha domains. they can be enabled manually 2024-01-25 13:21:58 +05:00			`regex_strings = [s for s in regex_strings if "." in s and len(s) >= 5]`
simplify script code and remove the manually added domain which is not necessary 2024-01-21 15:02:58 +05:00
remove google and recaptcha domains. they can be enabled manually 2024-01-25 13:21:58 +05:00			`# remove domains with blocked words`
			`blocked_words_for_includes = [`
			`"google",`
			`"youtube" #youtube is for redirecting shorts, but I remove it to avoid people worrying`
			`]`
			`regex_strings = [s for s in regex_strings if not any(word in s for word in blocked_words_for_includes)]`
add recaptcha and shrinkme.us to includes add recaptcha/api2 to match, so they are auto open when that option is enabled. Also added domain shrinkme.us which has one of those captchas 2024-01-21 00:45:53 +05:00
Upload files to "/" 2024-01-18 06:12:01 +05:00			`compile_and_print(regex_strings)`
			`except FileNotFoundError:`
			`print(f"Error: File '{file_path}' not found.")`
			`except Exception as e:`
			`print(f"An error occurred: {e}")`

			`if __name__ == "__main__":`
			`main()`