pakkinlau/gpt2md.py

## gpt2md.py
"""
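This script reads the output of GPT-3 from the clipboard, rewrites its LaTeX
math delimiters as Markdown-style `$` / `$$` delimiters, and copies the result
back to the clipboard.

Future: convert this script into a Chrome extension.


Linux users may need to install `xclip` or `xsel` so that pyperclip can find a
clipboard mechanism.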

`sudo apt-get install xclip`: Install xclip
"""

import re
import pyperclip
import platform
import subprocess
import sys

# Detect the operating system
if platform.system() == "Linux":
    # On Linux this script drives the clipboard through xclip, so make sure
    # the executable is present before selecting it.
    try:
        subprocess.check_output(['xclip', '-version'])
    except (OSError, subprocess.CalledProcessError):
        # A missing executable surfaces as FileNotFoundError (an OSError), not
        # CalledProcessError; catching only the latter would crash here
        # instead of reaching the install fallback.
        print("xclip is not installed. Attempting to install...")

        try:
            # Install xclip using the package manager (apt in this case)
            subprocess.check_call(['sudo', 'apt-get', 'install', 'xclip'])
            print("xclip installed successfully.")
        except (OSError, subprocess.CalledProcessError):
            # OSError covers systems where sudo or apt-get do not exist.
            print("Failed to install xclip. Please install it manually.")
            sys.exit(1)
    pyperclip.set_clipboard("xclip")

# Text to convert: whatever is currently on the clipboard.
gpt_response = pyperclip.paste()

def convert_text_pattern(text):
    r"""Rewrite LaTeX math delimiters in *text* as dollar-sign delimiters.

    Inline math ``\( ... \)`` becomes ``$...$`` and display math
    ``\[ ... \]`` becomes ``$$...$$``.  One whitespace character directly
    inside a delimiter is removed together with it, so ``\( x \)`` yields
    ``$x$``.  A display delimiter that sits on an indented line also absorbs
    the preceding newline and its indentation.

    Args:
        text: The string to convert.

    Returns:
        The converted string; text without any of these delimiters is
        returned unchanged.
    """
    # Order matters: the whitespace-aware rules must run before the bare
    # delimiter fallbacks, otherwise the fallbacks would consume the
    # delimiter and leave the adjacent whitespace behind.  A tuple of pairs
    # keeps that ordering explicit.
    substitutions = (
        (r"\n\s+\\\[", "$$"),  # newline + indentation + \[
        (r"\n\s+\\\]", "$$"),  # newline + indentation + \]
        (r"\\\[\s", "$$"),     # \[ followed by whitespace (incl. newline)
        (r"\\\(\s", "$"),      # \( followed by whitespace
        (r"\s\\\]", "$$"),     # \] preceded by whitespace (incl. newline)
        (r"\s\\\)", "$"),      # \) preceded by whitespace
        (r"\\\[", "$$"),       # any remaining \[
        (r"\\\]", "$$"),       # any remaining \]
        (r"\\\(", "$"),        # any remaining \(
        (r"\\\)", "$"),        # any remaining \)
    )

    # Apply the rules one after another, each on the output of the previous.
    for pattern, replacement in substitutions:
        text = re.sub(pattern, replacement, text)
    return text


# Convert the clipboard contents and place the result back on the clipboard.
converted_text = convert_text_pattern(text=gpt_response)
pyperclip.copy(converted_text)
	"""
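	This script reads the output of GPT-3 from the clipboard, rewrites its LaTeX
	math delimiters as Markdown-style `$` / `$$` delimiters, and copies the result
	back to the clipboard.

	Future: convert this script into a Chrome extension.


	Linux users may need to install `xclip` or `xsel` so that pyperclip can find a
	clipboard mechanism.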

	`sudo apt-get install xclip`: Install xclip
	"""

	import re
	import pyperclip
	import platform
	import subprocess
	import sys

	# Detect the operating system
	if platform.system() == "Linux":
	    # On Linux this script drives the clipboard through xclip, so make sure
	    # the executable is present before selecting it.
	    try:
	        subprocess.check_output(['xclip', '-version'])
	    except (OSError, subprocess.CalledProcessError):
	        # A missing executable surfaces as FileNotFoundError (an OSError), not
	        # CalledProcessError; catching only the latter would crash here
	        # instead of reaching the install fallback.
	        print("xclip is not installed. Attempting to install...")

	        try:
	            # Install xclip using the package manager (apt in this case)
	            subprocess.check_call(['sudo', 'apt-get', 'install', 'xclip'])
	            print("xclip installed successfully.")
	        except (OSError, subprocess.CalledProcessError):
	            # OSError covers systems where sudo or apt-get do not exist.
	            print("Failed to install xclip. Please install it manually.")
	            sys.exit(1)
	    pyperclip.set_clipboard("xclip")

	# Text to convert: whatever is currently on the clipboard.
	gpt_response = pyperclip.paste()

	def convert_text_pattern(text):
	    r"""Rewrite LaTeX math delimiters in *text* as dollar-sign delimiters.

	    Inline math ``\( ... \)`` becomes ``$...$`` and display math
	    ``\[ ... \]`` becomes ``$$...$$``.  One whitespace character directly
	    inside a delimiter is removed together with it, so ``\( x \)`` yields
	    ``$x$``.  A display delimiter that sits on an indented line also absorbs
	    the preceding newline and its indentation.

	    Args:
	        text: The string to convert.

	    Returns:
	        The converted string; text without any of these delimiters is
	        returned unchanged.
	    """
	    # Order matters: the whitespace-aware rules must run before the bare
	    # delimiter fallbacks, otherwise the fallbacks would consume the
	    # delimiter and leave the adjacent whitespace behind.  A tuple of pairs
	    # keeps that ordering explicit.
	    substitutions = (
	        (r"\n\s+\\\[", "$$"),  # newline + indentation + \[
	        (r"\n\s+\\\]", "$$"),  # newline + indentation + \]
	        (r"\\\[\s", "$$"),     # \[ followed by whitespace (incl. newline)
	        (r"\\\(\s", "$"),      # \( followed by whitespace
	        (r"\s\\\]", "$$"),     # \] preceded by whitespace (incl. newline)
	        (r"\s\\\)", "$"),      # \) preceded by whitespace
	        (r"\\\[", "$$"),       # any remaining \[
	        (r"\\\]", "$$"),       # any remaining \]
	        (r"\\\(", "$"),        # any remaining \(
	        (r"\\\)", "$"),        # any remaining \)
	    )

	    # Apply the rules one after another, each on the output of the previous.
	    for pattern, replacement in substitutions:
	        text = re.sub(pattern, replacement, text)
	    return text


	# Convert the clipboard contents and place the result back on the clipboard.
	converted_text = convert_text_pattern(text=gpt_response)
	pyperclip.copy(converted_text)