20q / modeling_twentyq.py

Upload folder using huggingface_hub

00cfc63 verified 2 months ago

12.6 kB

	"""TwentyQ: The world's smallest chat model.

	2-bit quantized neural network (1988), 156 attention heads, 1200 output classes.
	Trained on ~75 million conversations. Context window: 20 questions.
	"""

	import hashlib
	import random
	import torch
	import torch.nn as nn
	from transformers import PreTrainedModel, GenerationMixin
	from .configuration_twentyq import TwentyQConfig


	# Answer codes index the three scoring tables below:
	#   1 = No       (polarity 0)
	#   2 = Yes      (polarity 1)
	#   3 = Probably (polarity 0)
	#   4 = Doubtful (polarity 1)
	#   5 = Maybe    (polarity 0)
	#   6 = Unknown
	# Index 0 is the slot for "no usable answer" (the parser falls back to code 0
	# for replies it cannot map, and the ranker skips code 0 entries).
	# NOTE(review): codes 3 and 4 share their polarity with No and Yes
	# respectively, so "probably" is scored like a weak No and "doubtful" like a
	# weak Yes — confirm this is the intended mapping.
	POLARITY = [0, 0, 1, 0, 1, 0, 0]
	MATCH_BONUS = [0, 4, 4, 3, 3, 1, 0]
	MISS_PENALTY = [0, 4, 4, 1, 1, 0, 0]

	# Accepted user replies (already lower-cased by the parser) -> answer code.
	# "close" maps to -1, which is only meaningful as a reply to a guess.
	ANSWER_WORDS = {
	    word: code
	    for code, words in (
	        (2, ("yes", "y", "yeah", "yep", "usually")),
	        (1, ("no", "n", "nope", "nah")),
	        (3, ("probably", "prob", "likely")),
	        (4, ("doubtful", "doubt", "rarely")),
	        (5, ("maybe", "sometimes", "perhaps", "partly")),
	        (6, ("unknown", "dunno", "idk", "irrelevant", "skip")),
	        (-1, ("close",)),
	    )
	    for word in words
	}

	# Replies to the opening Animal/Vegetable/Mineral/Other question -> category code.
	AVM_WORDS = {
	    name: code
	    for code, name in enumerate(("animal", "vegetable", "mineral", "other"), start=1)
	}


	# Model class for the TwentyQ guessing game. It derives from the Transformers
	# PreTrainedModel and GenerationMixin bases; the game logic itself lives in
	# generate() and the private helpers defined on this class.
	class TwentyQForCausalLM(PreTrainedModel, GenerationMixin):
	# Configuration class paired with this model.
	config_class = TwentyQConfig
	# Declared empty: this model lists no tied weight keys.
	_tied_weights_keys = []

	def __init__(self, config):
	    """Build an empty model sized from ``config``.

	    Registers a single frozen one-element parameter (``_dummy``) and a
	    ``uint8`` buffer ``weight_matrix`` of shape
	    ``(config.num_questions, config.num_targets)`` filled with zeros.
	    The vocabulary is marked as not loaded until ``set_vocab`` is called.
	    """
	    super().__init__(config)
	    self.all_tied_weights_keys = {}

	    # Frozen placeholder parameter; it takes no part in scoring.
	    placeholder = torch.zeros(1)
	    self._dummy = nn.Parameter(placeholder, requires_grad=False)

	    # One uint8 cell per (question, target) pair.
	    empty_weights = torch.zeros(
	        config.num_questions,
	        config.num_targets,
	        dtype=torch.uint8,
	    )
	    self.register_buffer("weight_matrix", empty_weights)

	    self._vocab_loaded = False

	def set_vocab(self, questions, targets):
	    """Store the question and target strings and build lookup tables.

	    Args:
	        questions: iterable of question strings; position is the question index.
	        targets: iterable of target strings; position is the target index.

	    Both iterables are copied into lists. The lookup dictionaries are keyed
	    by the lower-cased string, so when two entries differ only by case the
	    later index wins. Marks the vocabulary as loaded.
	    """
	    question_list = list(questions)
	    target_list = list(targets)
	    self.questions_str = question_list
	    self.targets_str = target_list

	    question_index = {}
	    for position, question in enumerate(question_list):
	        question_index[question.lower()] = position
	    self._q_lookup = question_index

	    target_index = {}
	    for position, target in enumerate(target_list):
	        target_index[target.lower()] = position
	    self._t_lookup = target_index

	    self._vocab_loaded = True

	def _ensure_strings(self):
	if self._vocab_loaded:
	return
	raise RuntimeError(
	"Model vocabulary not loaded. Call model.set_vocab(questions, targets) "
	"or load a tokenizer with vocab.json alongside the model."
	)

	def forward(self, input_ids=None, **kwargs):
	    """Return placeholder logits; the game logic runs in ``generate()``.

	    Args:
	        input_ids: optional tensor whose first dimension is taken as the
	            batch size; a batch size of 1 is used when it is omitted.
	        **kwargs: accepted and ignored.

	    Returns:
	        dict with a single ``"logits"`` entry: an all-zero tensor of shape
	        ``(batch, 1, config.vocab_size)``.
	    """
	    batch_size = 1 if input_ids is None else input_ids.shape[0]
	    placeholder_logits = torch.zeros(batch_size, 1, self.config.vocab_size)
	    return {"logits": placeholder_logits}

	def generate(self, input_ids=None, attention_mask=None, **kwargs):
	    """Append the model's next game move to a byte-encoded conversation.

	    Args:
	        input_ids: integer tensor of shape ``(1, seq_len)``. Ids below 256
	            are treated as UTF-8 bytes of the chat-templated conversation;
	            ids of 256 and above are dropped before decoding.
	        attention_mask: accepted for API compatibility and ignored.
	        **kwargs: accepted and ignored.

	    Returns:
	        Tensor of shape ``(1, seq_len + response_len)``: ``input_ids``
	        followed by the UTF-8 bytes of the response, with the same dtype
	        and device as ``input_ids``.

	    Raises:
	        RuntimeError: if the vocabulary has not been loaded.
	        ValueError: if ``input_ids`` is missing or is not a single-row
	            2-D batch. Only one conversation can be answered per call, and
	            the final concatenation would otherwise fail with an opaque
	            size-mismatch error.
	    """
	    self._ensure_strings()

	    if input_ids is None:
	        raise ValueError(
	            "generate() requires input_ids holding the byte-encoded conversation."
	        )
	    if input_ids.dim() != 2 or input_ids.shape[0] != 1:
	        raise ValueError(
	            "generate() supports exactly one conversation per call; expected "
	            f"input_ids of shape (1, seq_len), got {tuple(input_ids.shape)}."
	        )

	    # Decode input_ids to text (byte-level tokenizer, filter specials > 255)
	    ids = input_ids[0].tolist()
	    raw_bytes = bytes(b for b in ids if b < 256)
	    text = raw_bytes.decode("utf-8", errors="replace")

	    # Parse conversation and get next response
	    answers, qnum, last_was_guess, game_over_msg, unrecognized = self._parse_conversation(text)

	    if unrecognized:
	        response = f"I didn't understand that. Please answer: {unrecognized}"
	    elif game_over_msg:
	        response = game_over_msg
	    else:
	        # Seed the RNG from the conversation text so the same history always
	        # produces the same move.
	        seed = int(hashlib.md5(text.encode()).hexdigest()[:8], 16)
	        self._rng = random.Random(seed)
	        response = self._next_move(answers, qnum, last_was_guess)

	    response_ids = list(response.encode("utf-8"))
	    response_tensor = torch.tensor([response_ids], dtype=input_ids.dtype, device=input_ids.device)
	    return torch.cat([input_ids, response_tensor], dim=1)

	def _parse_conversation(self, text):
	    """Parse chat-templated text into game state.

	    Lines starting with ``"[A] "`` are assistant turns and lines starting
	    with ``"[U] "`` are user turns; all other lines are ignored. Each
	    assistant turn is paired with the user turn that directly follows it.
	    Parsing stops at the first assistant turn that has no user reply.

	    When a reply was not understood, ``generate()`` answers with an
	    "I didn't understand that..." re-prompt. The user's next reply is then
	    applied to the prompt that was originally asked (question, guess, or
	    category), so a corrected answer is recorded rather than discarded.

	    Args:
	        text: the decoded conversation.

	    Returns:
	        Tuple ``(answers, qnum, last_was_guess, game_over_msg, unrecognized)``:
	        ``answers`` is a list of ``(index, answer_code, is_guess)`` where
	        ``index`` is a question index, or a target index for rejected
	        guesses; ``qnum`` counts the recorded entries; ``last_was_guess`` is
	        always ``False``; ``game_over_msg`` is the end-of-game text or
	        ``None``; ``unrecognized`` is a hint listing the accepted replies
	        when the latest reply could not be understood, else ``None``.
	    """
	    answers = []  # [(q_idx, ans_code, is_guess)]
	    qnum = 0
	    last_was_guess = False  # never set here; kept so the returned tuple keeps its shape
	    game_over_msg = None
	    unrecognized = None  # set to hint string if last answer wasn't understood
	    pending_prompt = None  # assistant prompt still waiting for a usable reply
	    reprompt_prefix = "i didn't understand that"

	    # Split into turns by [A] and [U] markers
	    turns = []
	    for line in text.replace("\r", "").split("\n"):
	        line = line.strip()
	        if line.startswith("[A] "):
	            turns.append(("a", line[4:].strip()))
	        elif line.startswith("[U] "):
	            turns.append(("u", line[4:].strip()))

	    # Pair up assistant/user turns
	    i = 0
	    while i < len(turns):
	        if turns[i][0] != "a":
	            i += 1
	            continue
	        if i + 1 >= len(turns) or turns[i + 1][0] != "u":
	            # This is the generation prompt — no user response yet
	            break

	        a_msg = turns[i][1]
	        u_msg = turns[i + 1][1]
	        i += 2

	        # A re-prompt carries no question of its own: the reply belongs to
	        # the prompt whose answer was not understood.
	        if pending_prompt is not None and a_msg.lower().startswith(reprompt_prefix):
	            a_msg = pending_prompt

	        a_lower = a_msg.lower()
	        u_lower = u_msg.lower().strip().rstrip(".")
	        needs_retry = False

	        if "animal, vegetable, mineral" in a_lower:
	            # AVM question
	            avm_code = AVM_WORDS.get(u_lower, 0)
	            if avm_code:
	                answers.append((0, avm_code, False))
	                qnum += 1
	                unrecognized = None
	            else:
	                unrecognized = "Animal, Vegetable, Mineral, or Other"
	                needs_retry = True

	        elif a_lower.startswith("i'm guessing"):
	            # Guess
	            target_name = a_msg.split("...")[-1].strip().rstrip("?").strip()
	            t_idx = self._t_lookup.get(target_name.lower(), -1)

	            ans_code = ANSWER_WORDS.get(u_lower, 0)
	            if ans_code == 2:  # Yes — correct guess
	                game_over_msg = f"I win! Got it in {qnum + 1} questions."
	                unrecognized = None
	            elif ans_code == 1 or ans_code == -1:  # No or Close
	                if t_idx >= 0:
	                    # Record the rejected target so it is not guessed again.
	                    answers.append((t_idx, 0, True))
	                    qnum += 1
	                unrecognized = None
	            else:
	                unrecognized = "Yes, No, or Close"
	                needs_retry = True

	        elif a_lower.startswith("i win") or a_lower.startswith("i'm stumped"):
	            # Game already over
	            game_over_msg = a_msg

	        else:
	            # Regular question
	            q_text = a_msg.rstrip("?").strip()
	            q_idx = self._q_lookup.get(q_text.lower(), -1)
	            ans_code = ANSWER_WORDS.get(u_lower, 0)
	            if ans_code == -1 or ans_code == 0:
	                unrecognized = "Yes, No, Probably, Doubtful, Maybe, or Unknown"
	                needs_retry = True
	            else:
	                unrecognized = None
	                if q_idx >= 0:
	                    answers.append((q_idx, ans_code, False))
	                    qnum += 1

	        pending_prompt = a_msg if needs_retry else None

	    return answers, qnum, last_was_guess, game_over_msg, unrecognized

	def _next_move(self, answers, qnum, last_was_guess):
	if qnum == 0:
	return "Is it Animal, Vegetable, Mineral, or Other?"

	if qnum >= 30:
	return "I'm stumped! I can't figure out what you're thinking of."

	nc, best_t, best_s, cidx, cscores = self._rank_targets(answers)

	if nc == 0:
	return "I'm stumped! I can't figure out what you're thinking of."

	should_guess = (
	nc == 1 or qnum == 20 or qnum == 24 or qnum == 30
	or (qnum >= 18 and nc <= 2)
	)

	if should_guess:
	return f"I'm guessing... {self.targets_str[best_t]}?"

	q = self._select_question(answers, nc, cidx)
	if q < 0:
	return f"I'm guessing... {self.targets_str[best_t]}?"

	return f"{self.questions_str[q]}?"

	def _score(self, answer_code, target, question):
	    """Score one answer against one target using the weight matrix.

	    Bit 0 of the stored weight is compared with the answer's polarity: a
	    mismatch yields the negated miss penalty for that answer code, a match
	    yields its bonus. If bit 1 of the weight is set the result is doubled.

	    Args:
	        answer_code: index into the answer-code tables.
	        target: target (column) index into ``weight_matrix``.
	        question: question (row) index into ``weight_matrix``.

	    Returns:
	        The signed integer score contribution.
	    """
	    weight = int(self.weight_matrix[question, target])
	    disagrees = (POLARITY[answer_code] ^ weight) & 1
	    points = -MISS_PENALTY[answer_code] if disagrees else MATCH_BONUS[answer_code]
	    return points * 2 if weight & 2 else points

	def _rank_targets(self, answers):
	max_c = 16 if len(answers) <= 10 else (8 if len(answers) <= 12 else 5)
	c_scores = [0] * max_c
	c_indices = [0] * max_c
	nc = 0
	best_t, best_s = 0, 0

	for t in range(self.config.num_targets):
	guessed = any(qi == t and ig for qi, _, ig in answers)
	if guessed:
	continue

	score = 0
	skip = False
	for qi, ac, ig in answers:
	if ig or ac == 0:
	continue
	if qi != 0:
	score += self._score(ac, t, qi)
	else:
	for k in range(4):
	score += self._score(4 if k + 1 == ac else 3, t, k)
	if len(answers) > 7 and score < 0:
	skip = True
	break

	if skip or score < 0:
	continue

	score += self._rng.randint(0, 7)

	if nc < max_c:
	slot = nc
	nc += 1
	else:
	min_s, slot = min((c_scores[j], j) for j in range(max_c))
	if min_s >= score:
	continue

	c_scores[slot] = score
	c_indices[slot] = t
	if score > best_s:
	best_t, best_s = t, score

	thresh = best_s // 4
	thresh = max(5, min(20, thresh))
	cutoff = best_s - thresh
	pi = [(c_indices[j], c_scores[j]) for j in range(nc) if c_scores[j] > cutoff]
	if not pi:
	return 0, best_t, best_s, [], []
	idx, sc = zip(*pi)
	return len(pi), best_t, best_s, list(idx), list(sc)

	def _select_question(self, answers, nc, cidx):
	best_s, best_q = -1000, -1
	asked = {qi for qi, _, ig in answers if not ig}

	for q in range(4, self.config.num_questions):
	if q in asked:
	continue
	pos, neg = 0, 0
	for t in cidx:
	w = int(self.weight_matrix[q, t])
	wt = 3 if (w & 2) else 1
	if w & 1:
	neg += wt
	else:
	pos += wt

	s = (pos * 2 - neg) if pos <= neg else (neg * 2 - pos)
	s += self._rng.randint(0, 7)
	if s > best_s:
	best_s, best_q = s, q

	return best_q

	def play(self, tokenizer=None):
	    """Run an interactive game on the terminal.

	    Args:
	        tokenizer: tokenizer used to apply the chat template and to
	            encode/decode text. When omitted, a ``TwentyQTokenizer`` is
	            created and given a minimal ``[A]``/``[U]`` chat template.

	    The loop ends when the model declares a win or that it is stumped, or
	    when the user submits an empty reply.

	    Raises:
	        RuntimeError: if the vocabulary has not been loaded.
	    """
	    self._ensure_strings()

	    if tokenizer is None:
	        # Minimal fallback — construct chat text directly
	        from .tokenization_twentyq import TwentyQTokenizer

	        fallback_template = (
	            "{% if messages[0]['role'] == 'system' %}{{ messages[0]['content'] }}\n"
	            "{% set loop_messages = messages[1:] %}{% else %}"
	            "{% set loop_messages = messages %}{% endif %}"
	            "{% for message in loop_messages %}"
	            "{% if message['role'] == 'assistant' %}[A] {{ message['content'] }}\n"
	            "{% elif message['role'] == 'user' %}[U] {{ message['content'] }}\n"
	            "{% endif %}{% endfor %}"
	            "{% if add_generation_prompt %}[A] {% endif %}"
	        )
	        tokenizer = TwentyQTokenizer()
	        tokenizer.chat_template = fallback_template

	    history = [
	        {"role": "system", "content": "Think of something and I'll try to guess it in 20 questions."},
	    ]
	    print("\n Think of something...\n")
	    input(" Press Enter when ready... ")

	    while True:
	        # Render the whole history and ask the model for its next move.
	        prompt_text = tokenizer.apply_chat_template(history, add_generation_prompt=True, tokenize=False)
	        prompt_ids = tokenizer.encode(prompt_text, return_tensors="pt")
	        generated = self.generate(prompt_ids)
	        prompt_len = prompt_ids.shape[1]
	        response = tokenizer.decode(generated[0, prompt_len:].tolist())

	        history.append({"role": "assistant", "content": response})
	        print(f"\n > {response}")

	        game_finished = "I win" in response or "stumped" in response
	        if game_finished:
	            return

	        # Show the set of replies that fits the kind of prompt just printed.
	        if "Animal, Vegetable, Mineral" in response:
	            hint = "(Animal/Vegetable/Mineral/Other)"
	        elif "guessing" in response.lower():
	            hint = "(Yes/No/Close)"
	        else:
	            hint = "(Yes/No/Probably/Doubtful/Maybe/Unknown)"

	        reply = input(f" {hint}: ").strip()
	        if not reply:
	            return
	        history.append({"role": "user", "content": reply})