url = 'https://raw.githubusercontent.com/first20hours/google-10000-english/master/google-10000-english-usa-no-swears-medium.txt'

!mkdir -p data
!wget -q {url} -P data


# Five character classes, one per letter of the word, each rejecting every
# letter of "snake" (s, n, a, k, e).
pattern='[^snake][^snake][^snake][^snake][^snake]'

# IPython substitutes {pattern} into the shell command. ^...$ makes the
# pattern span the whole line; head keeps only the first ten matches.
!grep '^{pattern}$' 'data/google-10000-english-usa-no-swears-medium.txt' | head

which
would
world
group
could
right
forum
photo
topic
court


# Same search, but count the matching lines instead of listing them.
!grep '^{pattern}$' 'data/google-10000-english-usa-no-swears-medium.txt' | wc -l

108


# Every position now also rejects o and u on top of the "snake" letters;
# the first position additionally rejects 'm'.
# NOTE(review): 's' appears twice in each class ("snake" + "ous"); the
# duplicate is redundant but harmless.
pattern='[^msnakeous][^snakeous][^snakeous][^snakeous][^snakeous]'

# First ten whole-line matches for the tightened pattern.
!grep '^{pattern}$' 'data/google-10000-english-usa-no-swears-medium.txt' | head

which
right
light
child
third
civil
limit
birth
fight
width


# Number of words that survive the tightened pattern.
!grep '^{pattern}$' 'data/google-10000-english-usa-no-swears-medium.txt' | wc -l

27


# Second letter is fixed to 'r'. 't' joins the rejected letters in every
# open position, the fourth position also rejects 'i', and the first
# position still rejects 'm'.
pattern='[^msnakeoust]r[^snakeoust][^snakeousti][^snakeoust]'

# No head/wc here: print every remaining match.
!grep '^{pattern}$' 'data/google-10000-english-usa-no-swears-medium.txt'

grill
drill


# First four letters fixed to "crim"; only the last letter is open, and it
# rejects the letters s, n, a, k, e, o, u, t.
pattern='crim[^snakeoust]'

# NOTE(review): this cell switches to data/100k, a file that no visible
# cell downloads or creates -- confirm where that word list comes from.
!grep '^{pattern}$' data/100k

crimp


# New search: every position rejects m, o, e; the third position also
# rejects 'u' and the fourth also rejects 's'.
pattern='[^moe][^moe][^moeu][^moes][^moe]'
# Count the whole-line matches in data/100k.
!grep '^{pattern}$' data/100k | wc -l

2945


# Peek at the first ten matches of the same pattern.
!grep '^{pattern}$' data/100k | head

which
click
links
right
using
black
think
shall
still
visit


# grep defaults to basic regular expressions, where ( | ) are literal
# characters, so this search finds nothing.
!grep '(which|could)' data/100k


# -E switches to extended regular expressions, where (a|b) is an
# alternation, so both words are found.
!grep -E '(which|could)' data/100k

which
could


# -P selects Perl-compatible regular expressions. Matches lines that
# contain "su" or "us" followed by any three characters.
# NOTE(review): unlike the earlier cells this pattern is not anchored with
# ^...$; presumably data/100k holds only five-letter words -- confirm.
!grep -P '(su...|us...)' data/100k | head

using
users
super
suite
usage
sugar
susan
usual
sunny
sudan


# Same two layouts, but the three trailing letters must not be m, o or e.
# NOTE(review): still unanchored; see whether ^...$ is needed for data/100k.
!grep -P '(su[^moe][^moe][^moe]|us[^moe][^moe][^moe])' data/100k | head

using
sugar
susan
usual
sunny
sudan
suits
sucks
supra
sushi


from itertools import product

# Candidate 0-based positions for the letters 'u' and 's': U leaves out
# index 2 and S leaves out index 3.
U = {0, 1, 3, 4}
S = {0, 1, 2, 4}

# Every (u position, s position) pairing in which the two letters do not
# land on the same index.
combinations = [slots for slots in product(U, S) if slots[0] != slots[1]]
combinations

[(0, 1),
 (0, 2),
 (0, 4),
 (1, 0),
 (1, 2),
 (1, 4),
 (3, 0),
 (3, 1),
 (3, 2),
 (3, 4),
 (4, 0),
 (4, 1),
 (4, 2)]


# Build one five-character regex per (u, s) placement: the two letters sit
# at their chosen indices and every other index rejects m, o and e.
# NOTE(review): the gaps only reject m, o, e, so a second 'u' or 's' may
# still appear in any gap position.
patterns = []
for u, s in combinations:
    placed = {u: 'u', s: 's'}
    pattern = [placed.get(index, '[^moe]') for index in range(5)]
    patterns.append(''.join(pattern))
patterns

['us[^moe][^moe][^moe]',
 'u[^moe]s[^moe][^moe]',
 'u[^moe][^moe][^moe]s',
 'su[^moe][^moe][^moe]',
 '[^moe]us[^moe][^moe]',
 '[^moe]u[^moe][^moe]s',
 's[^moe][^moe]u[^moe]',
 '[^moe]s[^moe]u[^moe]',
 '[^moe][^moe]su[^moe]',
 '[^moe][^moe][^moe]us',
 's[^moe][^moe][^moe]u',
 '[^moe]s[^moe][^moe]u',
 '[^moe][^moe]s[^moe]u']


# Glue the per-placement regexes into a single alternation (a|b|c|...).
'|'.join(patterns)

'us[^moe][^moe][^moe]|u[^moe]s[^moe][^moe]|u[^moe][^moe][^moe]s|su[^moe][^moe][^moe]|[^moe]us[^moe][^moe]|[^moe]u[^moe][^moe]s|s[^moe][^moe]u[^moe]|[^moe]s[^moe]u[^moe]|[^moe][^moe]su[^moe]|[^moe][^moe][^moe]us|s[^moe][^moe][^moe]u|[^moe]s[^moe][^moe]u|[^moe][^moe]s[^moe]u'


# IPython evaluates the {...} expression and splices the joined
# alternation into the shell command; head shows the first ten matches.
# NOTE(review): the alternation is not anchored with ^...$; presumably
# data/100k holds only five-letter words -- confirm.
!grep -P '({"|".join(patterns)})' data/100k | head

using
pussy
units
funds
virus
sugar
susan
turns
usual
busty


# Count the lines matched by the joined alternation.
!grep -P '({"|".join(patterns)})' data/100k | wc -l

235


# Candidate 0-based positions for each tracked letter. The subtractions
# drop one further index from the candidate sets of 'u' and 's'.
positions = {
    'u': {0, 1, 3, 4} - {0},
    's': {0, 1, 2, 4} - {1},
    'g': {0, 1, 2, 3}
}

# One tuple per assignment (same letter order as the dict), keeping only
# those in which every letter gets its own index.
combinations = [
    slots
    for slots in product(*positions.values())
    if len(slots) == len(set(slots))
]


# Each index starts with the letters rejected everywhere (m, o, e, i, n);
# a tracked letter is added wherever it is not a candidate for that index.
rejected = [list('moein') for _ in range(5)]
for slot, letters in enumerate(rejected):
    for letter, allowed in positions.items():
        if slot not in allowed:
            letters.append(letter)

# Render each index's rejected letters as a negated character class.
exclude = ['[^' + ''.join(letters) + ']' for letters in rejected]
exclude

['[^moeinu]', '[^moeins]', '[^moeinu]', '[^moeins]', '[^moeing]']


# Build one regex per (u, s, g) placement: the three letters sit at their
# chosen indices and every other index keeps its own rejection class from
# `exclude`.
patterns = []
for u, s, g in combinations:
    placed = {u: 'u', s: 's', g: 'g'}
    pattern = [placed.get(index, gap) for index, gap in enumerate(exclude)]
    patterns.append(''.join(pattern))
patterns

['sug[^moeins][^moeing]',
 'su[^moeinu]g[^moeing]',
 'gus[^moeins][^moeing]',
 '[^moeinu]usg[^moeing]',
 'gu[^moeinu][^moeins]s',
 '[^moeinu]ug[^moeins]s',
 '[^moeinu]u[^moeinu]gs',
 'sg[^moeinu]u[^moeing]',
 's[^moeins]gu[^moeing]',
 'g[^moeins]su[^moeing]',
 '[^moeinu]gsu[^moeing]',
 'g[^moeins][^moeinu]us',
 '[^moeinu]g[^moeinu]us',
 '[^moeinu][^moeins]gus',
 'sg[^moeinu][^moeins]u',
 's[^moeins]g[^moeins]u',
 's[^moeins][^moeinu]gu',
 'g[^moeins]s[^moeins]u',
 '[^moeinu]gs[^moeins]u',
 '[^moeinu][^moeins]sgu']


# Search with the joined alternation and let nl number every match.
!grep -P '({"|".join(patterns)})' data/100k | nl

     1	sugar
     2	argus
     3	gurus
     4	gusts
     5	juggs
     6	gulls
     7	gurps
     8	gyrus
     9	gusta
    10	dysgu
    11	gusty
    12	suggs
    13	vagus

# Solving Wordle using Regex (and a little bit of Python)

## Give Me the Words

## Let the Game Begin

## A More Interesting Example

## Epilogue