
154 lines
4.3 KiB
Raw Normal View History

2022-02-21 21:03:28 +00:00
from argparse import ArgumentParser
from asyncio import create_task, sleep, run
from random import randint, choice
2022-07-17 20:50:29 +00:00
from re import sub
2022-02-21 18:30:20 +00:00
from transformers import AutoTokenizer, AutoModelForCausalLM
2022-02-21 22:40:27 +00:00
2022-02-21 21:03:28 +00:00
# Command-line interface. -b/-i/-t may each be repeated; argparse collects
# them into parallel lists that are consumed together, one entry per account.
parser = ArgumentParser()
parser.add_argument('-n', '--input', help='initial input text')
parser.add_argument('-b', '--backend', choices=['mastodon', 'misskey', 'matrix'],
                    action='append', help='fediverse server type')
parser.add_argument('-i', '--instance', action='append',
                    help='instance hosting the bot (repeat once per --backend)')
parser.add_argument('-t', '--token', action='append',
                    help='access token for the instance (repeat once per --backend)')
parser.add_argument('-d', '--data', default='data',
                    help='data for automatic input generation')
parser.add_argument('-m', '--model', default='model',
                    help='path to load saved model')
parser.add_argument('-y', '--yes', action='store_true',
                    help='answer yes to all prompts')
args = parser.parse_args()

# The three repeatable options are zipped together later, which would silently
# drop any unpaired entry. Reject mismatched counts here, before the model is
# loaded, so the mistake is reported immediately.
if not (len(args.backend or []) == len(args.instance or [])
        == len(args.token or [])):
    parser.error('--backend, --instance and --token must be given '
                 'the same number of times')

# The tokenizer is always the stock gpt2-large one; only the model weights are
# read from the --model path. The model is moved to the CUDA device.
tokenizer = AutoTokenizer.from_pretrained('gpt2-large')
model = AutoModelForCausalLM.from_pretrained(args.model).to('cuda')
2022-02-21 18:30:20 +00:00
2022-02-21 21:03:28 +00:00
# Canned openers for generate_input().
_PROMPTS = (
    'I am',
    'My life is',
    'Computers are',
    'This is',
    'No one',
    'I love',
    'I will die of',
    'I\'m going to die',
    'My favorite',
    'I\'m not',
    'I hate',
    'I think',
    'In my opinion',
    'Breaking news:',
    'Have I ever told you that',
    'I read on the news that',
    'I never knew that',
    'My dream is',
    'It\'s terrible that',
    'My new theory:',
    'My conspiracy theory',
    'The worst thing',
)


def generate_input():
    """Return a short random prompt to seed text generation.

    With equal probability the prompt is either one of the canned openers
    in ``_PROMPTS`` or the first two words of a random line of the file
    named by ``args.data``. If that file contains no line with at least two
    words, a canned opener is returned instead.
    """
    # Create random input
    if randint(0, 1) == 0:
        return choice(_PROMPTS)

    with open(args.data, 'r') as f:
        # Only lines with at least two words can supply a two-word prompt.
        candidates = [words for words in map(str.split, f) if len(words) >= 2]

    if not candidates:
        # Picking a line blindly and retrying would never terminate here
        # (and an empty file would make choice() raise), so fall back.
        return choice(_PROMPTS)

    first, second = choice(candidates)[:2]
    return first + ' ' + second
if args.input is None:
    args.input = generate_input()

# Loop until we're satisfied
# NOTE(review): the bodies of the `args.yes`, "unrecognised reply" and "post"
# branches were missing from the reviewed text; they are reconstructed from
# the prompt's option list and the --yes help string. Confirm against history.
while True:
    # Run the input through the model
    inputs = tokenizer.encode(args.input, return_tensors='pt').to('cuda')
    output = tokenizer.decode(model.generate(
        inputs, max_length=150, do_sample=True, top_p=0.9)[0])

    # Prepare the post: the first line of the output, plus the second line
    # when the first is shorter than 200 characters, capped at 500 characters.
    output = output.split('\n')
    post = output[0]
    if len(post) < 200 and len(output) > 1:
        post = output[0] + '\n' + output[1]
    post = post[:500]

    # Remove mentions: drop the trailing '@domain' part of '@user@domain'
    post = sub('(@[^ ]*)@[^ ]*', '\\1', post)

    if args.yes:
        # Non-interactive mode: accept the first candidate.
        break

    # Prompt the user
    print(post)
    res = input('Post/Retry/New input/Custom input/Quit: ').strip().lower()

    # Compare the whole reply against each option. A substring test such as
    # `res in 'pP'` is true for an empty reply, which would make a bare Enter
    # publish the post.
    if res == 'p':
        break
    elif res == 'n':
        args.input = generate_input()
    elif res == 'c':
        args.input = input('Enter custom input: ')
    elif res != 'r':
        # Anything that is not Post/Retry/New/Custom quits without posting.
        raise SystemExit(0)
    # 'r' falls through and regenerates from the same input.
2022-07-17 20:50:29 +00:00
2022-02-28 00:00:22 +00:00
# Post it!
for backend, instance, token in zip(args.backend, args.instance, args.token):
if backend == 'mastodon':
from mastodon import Mastodon
2022-02-28 00:00:22 +00:00
mastodon = Mastodon(
2022-03-01 04:23:05 +00:00
elif backend == 'misskey':
from Misskey import Misskey
2022-02-28 00:00:22 +00:00
misskey = Misskey(instance, i=token)
2022-03-01 04:23:05 +00:00
elif backend == 'matrix':
import simplematrixbotlib as botlib
2022-03-01 04:23:05 +00:00
creds = botlib.Creds(instance, 'ebooks', token)
bot = botlib.Bot(creds)
2022-03-01 04:23:05 +00:00
async def room_joined(room_id):
await bot.api.send_text_message(room_id=room_id, message=post)
2022-03-01 04:23:05 +00:00
async def wait_quit():
await sleep(5)
async def run_bot():
run = create_task(bot.main())
wait = create_task(wait_quit())
await run
await wait