-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathPatternManager.cs
230 lines (190 loc) · 7.86 KB
/
PatternManager.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
using Newtonsoft.Json;
using System.Text.RegularExpressions;
namespace WordleReverseSolver
{
/// <summary>
/// Statistics kept for one distinct result pattern found in tweets.
/// </summary>
internal class PatternData
{
    /// <summary>Number of times the pattern was found in tweets.</summary>
    public int IncidenceCount { get; set; }

    /// <summary>ID of some tweet that contains this pattern.</summary>
    // Initialized to an empty string so the non-nullable property is never observed as null.
    public string SampleTweetId { get; set; } = string.Empty;
}
internal class PatternManager: ICloneable
{
// Number of cells in one result row (one cell per letter of the guess)
const int WordLength = 5;
// Black and gray are alternatives that mean the same thing (a cell encoded as 0).
// 0x2B1B is U+2B1B BLACK LARGE SQUARE; 0x2B1C is U+2B1C WHITE LARGE SQUARE.
const char black = (char)0x2B1B;
const char gray = (char)0x2B1C;
// The yellow and green squares lie outside the BMP, so each one is two UTF-16 chars:
// a shared first (high surrogate) char followed by a color-specific second char.
// 0xD83D 0xDFE8 is U+1F7E8 (yellow, encoded as 1); 0xD83D 0xDFE9 is U+1F7E9 (green, encoded as 2).
const char yellowGreenFirstChar = (char)0xD83D;
const char yellowSecondChar = (char)0xDFE8;
const char greenSecondChar = (char)0xDFE9;
const int allCorrectPattern = 242; // All 2s, so 3^5-1
// Patterns seen so far, keyed by their base-3 integer encoding (see PatternArrayToSingleInteger)
Dictionary<int, PatternData> _patterns = new Dictionary<int, PatternData>();
// Number of tweets iterated by ReadFromTwitter; incremented for every tweet, even ignored or failed ones
public int TweetCount { get; private set; }
// Private: instances are only created inside this class (ReadFromTwitter and Clone)
private PatternManager() { }
/// <summary>
/// Searches Twitter for tweets mentioning the given Wordle puzzle and collects the
/// result patterns found in them.
/// </summary>
/// <param name="puzzleNumber">Number of the Wordle puzzle to search for.</param>
/// <returns>A manager holding every pattern parsed from the fetched tweets.</returns>
public static async Task<PatternManager> ReadFromTwitter(int puzzleNumber)
{
    // Upper bound on the number of result pages requested
    const int maxPages = 100;
    // Paging stops once more than this many distinct patterns have been collected
    const int enoughPatterns = 100;

    var manager = new PatternManager();
    var twitterSearch = new TwitterSearchService();
    string? nextToken = null;

    for (int page = 0; page < maxPages; page++)
    {
        var query = $"?query=%22Wordle {puzzleNumber}%22 -RT";
        if (nextToken != null) query += $"&next_token={nextToken}";

        var res = await twitterSearch.GetData(query);
        dynamic twitterResponse = JsonConvert.DeserializeObject(res);

        // An empty body or an error payload carries no "meta" object; stop paging
        // instead of failing on a null dereference.
        if (twitterResponse?.meta == null) break;

        nextToken = twitterResponse.meta.next_token;

        // "data" may be absent when a page contains no tweets; enumerating null would throw.
        if (twitterResponse.data != null)
        {
            foreach (var tweet in twitterResponse.data)
            {
                try
                {
                    manager.ParseTweetText((string)tweet.id, (string)tweet.text, puzzleNumber);
                }
                catch (Exception ex)
                {
                    // Best effort: one malformed tweet must not abort the whole search
                    Console.WriteLine($"Failed to process tweet {tweet.id}: { ex.Message}");
                }

                // Counted whether or not the tweet yielded any pattern
                manager.TweetCount++;
            }
        }

        if (nextToken == null || manager._patterns.Count > enoughPatterns) break;
    }

    return manager;
}
/// <summary>
/// Removes the given pattern from the set of known patterns.
/// </summary>
/// <param name="patternArray">Pattern as one base-3 digit per cell.</param>
/// <returns>True if the pattern was present and has been removed; otherwise false.</returns>
public bool RemovePattern(int[] patternArray) =>
    _patterns.Remove(PatternArrayToSingleInteger(patternArray));
/// <summary>Number of distinct patterns currently held.</summary>
public int Count => _patterns.Count;
/// <summary>
/// Adds up the incidence counts of all patterns currently held.
/// </summary>
/// <returns>The sum of <c>IncidenceCount</c> over every stored pattern.</returns>
public int GetTotalPatternIncidenceCount()
{
    int sum = 0;
    foreach (PatternData data in _patterns.Values)
    {
        sum += data.IncidenceCount;
    }

    return sum;
}
// Tweets matching any of these regexes are ignored entirely
static readonly string[] BannedRegexes = new string[] {
    "http://", // Links are often a sign of some non-English Wordle, e.g. wordle.at
    "https://",
    "[\u3040-\u30ff\u3400-\u4dbf\u4e00-\u9fff\uf900-\ufaff\uff66-\uff9f]", // Japanese/Chinese characters
    "[\u0600-\u06ff]|[\u0750-\u077f]|[\ufb50-\ufc3f]|[\ufe70-\ufefc]", // Arabic characters
    @"\p{IsCyrillic}" // Russian characters
};

// Chars that can begin a result cell; used to locate the start of the next row
static readonly char[] PatternStartChars = new char[] { black, gray, yellowGreenFirstChar };

/// <summary>
/// Extracts every complete result row from a tweet and records it via AddPattern.
/// </summary>
/// <remarks>
/// Parsing stops silently at the first unexpected character, at the end of the text
/// (including a row cut off mid-way), or after the all-correct row has been recorded.
/// </remarks>
/// <param name="tweetId">ID of the tweet, stored as the sample for any new pattern.</param>
/// <param name="tweetText">Full text of the tweet.</param>
/// <param name="puzzleNumber">Puzzle number the tweet must mention to be considered.</param>
void ParseTweetText(string tweetId, string tweetText, int puzzleNumber)
{
    // U+FE0F VARIATION SELECTOR-16 sometimes follows a square; it carries no information here
    const char variationSelector16 = (char)0xFE0F;

    int tweetTextIndex = tweetText.IndexOf($"Wordle {puzzleNumber} ", StringComparison.InvariantCultureIgnoreCase);

    // Bail out if it doesn't seem to relate to this puzzle number
    if (tweetTextIndex < 0)
    {
        return;
    }

    foreach (var bannedRegex in BannedRegexes)
    {
        if (Regex.IsMatch(tweetText, bannedRegex))
        {
            Console.WriteLine($"Ignoring tweet {tweetId} which contains banned regex '{bannedRegex}'");
            return;
        }
    }

    for (; ; )
    {
        // Jump to the first cell of the next row, if any
        tweetTextIndex = tweetText.IndexOfAny(PatternStartChars, tweetTextIndex);
        if (tweetTextIndex < 0) return;

        int[] pattern = new int[WordLength];
        int patternIndex = 0;

        while (patternIndex < WordLength)
        {
            // Text ended in the middle of a row: drop the partial row instead of throwing
            if (tweetTextIndex >= tweetText.Length) return;

            char current = tweetText[tweetTextIndex++];
            if (current == black || current == gray)
            {
                pattern[patternIndex++] = 0;
            }
            else if (current == yellowGreenFirstChar)
            {
                // A lone first surrogate char at the very end of the text cannot be decoded
                if (tweetTextIndex >= tweetText.Length) return;

                char second = tweetText[tweetTextIndex++];
                if (second == yellowSecondChar)
                {
                    pattern[patternIndex++] = 1;
                }
                else if (second == greenSecondChar)
                {
                    pattern[patternIndex++] = 2;
                }
                else
                {
                    // Some other emoji sharing the same first char: not a result row
                    return;
                }
            }
            else if (current != variationSelector16)
            {
                // Anything else inside a row means this is not a valid result row
                return;
            }
        }

        // Last line with all correct, so no need to look further
        if (AddPattern(pattern, tweetId) == allCorrectPattern) return;
    }
}
/// <summary>
/// Records one occurrence of a pattern, creating its entry on first sight.
/// </summary>
/// <param name="patternArray">Pattern as one base-3 digit per cell.</param>
/// <param name="tweetId">ID of the tweet the pattern came from; kept only for a new pattern.</param>
/// <returns>The integer encoding of the pattern.</returns>
private int AddPattern(int[] patternArray, string tweetId)
{
    int integerPattern = PatternArrayToSingleInteger(patternArray);

    // Single lookup instead of ContainsKey followed by two indexer accesses
    if (!_patterns.TryGetValue(integerPattern, out var data))
    {
        data = new PatternData { SampleTweetId = tweetId };
        _patterns.Add(integerPattern, data);
    }

    data.IncidenceCount++;
    return integerPattern;
}
/// <summary>
/// Writes one console line per stored pattern: sample tweet ID, incidence count,
/// then the pattern's digits.
/// </summary>
internal void DumpAllPatterns()
{
    foreach (var (encodedPattern, data) in _patterns)
    {
        string prefix = $"{data.SampleTweetId} ({data.IncidenceCount}): ";
        Console.Write(prefix);

        int[] digits = SingleIntegerToArrayPattern(encodedPattern);
        DumpPattern(digits);
    }
}
/// <summary>
/// Encodes a pattern as a single integer by reading its cells as base-3 digits,
/// first cell most significant.
/// </summary>
/// <param name="patternArray">Pattern as one digit per cell.</param>
/// <returns>The base-3 value of the digits; 0 for an empty array.</returns>
static int PatternArrayToSingleInteger(int[] patternArray)
{
    int encoded = 0;
    foreach (int digit in patternArray)
    {
        encoded = encoded * 3 + digit;
    }

    return encoded;
}
/// <summary>
/// Decodes an integer into its WordLength base-3 digits, most significant digit first.
/// </summary>
/// <param name="integerPattern">Integer encoding of a pattern.</param>
/// <returns>A new array of WordLength digits.</returns>
static int[] SingleIntegerToArrayPattern(int integerPattern)
{
    var digits = new int[WordLength];
    int remaining = integerPattern;

    // Peel off the least significant digit first, filling the array from its end
    for (int pos = digits.Length - 1; pos >= 0; pos--)
    {
        remaining = Math.DivRem(remaining, 3, out digits[pos]);
    }

    return digits;
}
/// <summary>
/// Writes the digits of a pattern to the console with no separators, followed by a line break.
/// </summary>
/// <param name="patternArray">Pattern as one digit per cell.</param>
static void DumpPattern(int[] patternArray)
{
    foreach (int digit in patternArray)
    {
        Console.Write(digit);
    }

    Console.WriteLine();
}
/// <summary>
/// Creates an independent copy of this manager.
/// </summary>
/// <remarks>
/// The copy carries over <see cref="TweetCount"/> and gets its own PatternData instances,
/// so later changes to either manager do not affect the other.
/// </remarks>
/// <returns>A new <see cref="PatternManager"/> with the same patterns and tweet count.</returns>
public object Clone()
{
    var manager = new PatternManager { TweetCount = TweetCount };
    manager._patterns = new Dictionary<int, PatternData>(_patterns.Count);

    foreach (var entry in _patterns)
    {
        // Copy the value object too: PatternData is mutable and must not be shared
        manager._patterns[entry.Key] = new PatternData
        {
            IncidenceCount = entry.Value.IncidenceCount,
            SampleTweetId = entry.Value.SampleTweetId,
        };
    }

    return manager;
}
}
}