-
-
Notifications
You must be signed in to change notification settings - Fork 29
[#2089] Updated Solr to v9. #2103
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,185 @@ | ||
| # À => A | ||
| "\u00C0" => "A" | ||
| # Á => A | ||
| "\u00C1" => "A" | ||
| # Â => A | ||
| "\u00C2" => "A" | ||
| # Ã => A | ||
| "\u00C3" => "A" | ||
| # Ä => A | ||
| #"\u00C4" => "A" | ||
| # Å => A | ||
| #"\u00C5" => "A" | ||
| # Ą => A | ||
| "\u0104" => "A" | ||
| # Æ => AE | ||
| "\u00C6" => "AE" | ||
| # Ç => C | ||
| "\u00C7" => "C" | ||
| # Ć => C | ||
| "\U0106" => "C" | ||
| # È => E | ||
| "\u00C8" => "E" | ||
| # É => E | ||
| "\u00C9" => "E" | ||
| # Ê => E | ||
| "\u00CA" => "E" | ||
| # Ë => E | ||
| "\u00CB" => "E" | ||
| # Ę => E | ||
| "\u0118" => "E" | ||
| # Ì => I | ||
| "\u00CC" => "I" | ||
| # Í => I | ||
| "\u00CD" => "I" | ||
| # Î => I | ||
| "\u00CE" => "I" | ||
| # Ï => I | ||
| "\u00CF" => "I" | ||
| # Ĳ => IJ | ||
| "\u0132" => "IJ" | ||
| # Ð => D | ||
| "\u00D0" => "D" | ||
| # Ł => L | ||
| "\u0141" => "L" | ||
| # Ñ => N | ||
| "\u00D1" => "N" | ||
| # Ń => N | ||
| "\u0143" => "N" | ||
| # Ò => O | ||
| "\u00D2" => "O" | ||
| # Ó => O | ||
| "\u00D3" => "O" | ||
| # Ô => O | ||
| "\u00D4" => "O" | ||
| # Õ => O | ||
| "\u00D5" => "O" | ||
| # Ö => O | ||
| #"\u00D6" => "O" | ||
| # Ø => O | ||
| "\u00D8" => "O" | ||
| # Œ => OE | ||
| "\u0152" => "OE" | ||
| # Þ => TH | ||
| "\u00DE" => "TH" | ||
| # Ù => U | ||
| "\u00D9" => "U" | ||
| # Ú => U | ||
| "\u00DA" => "U" | ||
| # Û => U | ||
| "\u00DB" => "U" | ||
| # Ü => U | ||
| "\u00DC" => "U" | ||
| # Ý => Y | ||
| "\u00DD" => "Y" | ||
| # Ÿ => Y | ||
| "\u0178" => "Y" | ||
| # à => a | ||
| "\u00E0" => "a" | ||
| # á => a | ||
| "\u00E1" => "a" | ||
| # â => a | ||
| "\u00E2" => "a" | ||
| # ã => a | ||
| "\u00E3" => "a" | ||
| # ä => a | ||
| #"\u00E4" => "a" | ||
| # å => a | ||
| #"\u00E5" => "a" | ||
| # æ => ae | ||
| "\u00E6" => "ae" | ||
| # ç => c | ||
| "\u00E7" => "c" | ||
| # è => e | ||
| "\u00E8" => "e" | ||
| # é => e | ||
| "\u00E9" => "e" | ||
| # ê => e | ||
| "\u00EA" => "e" | ||
| # ë => e | ||
| "\u00EB" => "e" | ||
| # ì => i | ||
| "\u00EC" => "i" | ||
| # í => i | ||
| "\u00ED" => "i" | ||
| # î => i | ||
| "\u00EE" => "i" | ||
| # ï => i | ||
| "\u00EF" => "i" | ||
| # ĳ => ij | ||
| "\u0133" => "ij" | ||
| # ð => d | ||
| "\u00F0" => "d" | ||
| # ñ => n | ||
| "\u00F1" => "n" | ||
| # ò => o | ||
| "\u00F2" => "o" | ||
| # ó => o | ||
| "\u00F3" => "o" | ||
| # ô => o | ||
| "\u00F4" => "o" | ||
| # õ => o | ||
| "\u00F5" => "o" | ||
| # ö => o | ||
| #"\u00F6" => "o" | ||
| # ø => o | ||
| "\u00F8" => "o" | ||
| # œ => oe | ||
| "\u0153" => "oe" | ||
| # ß => ss | ||
| "\u00DF" => "ss" | ||
| # Ś => S | ||
| "\u015a" => "S" | ||
| # þ => th | ||
| "\u00FE" => "th" | ||
| # ù => u | ||
| "\u00F9" => "u" | ||
| # ú => u | ||
| "\u00FA" => "u" | ||
| # û => u | ||
| "\u00FB" => "u" | ||
| # ü => u | ||
| "\u00FC" => "u" | ||
| # ý => y | ||
| "\u00FD" => "y" | ||
| # ÿ => y | ||
| "\u00FF" => "y" | ||
| # Ź => Z | ||
| "\u0179" => "Z" | ||
| # Ż => Z | ||
| "\u017b" => "Z" | ||
| # ﬀ => ff | ||
| "\uFB00" => "ff" | ||
| # ﬁ => fi | ||
| "\uFB01" => "fi" | ||
| # ﬂ => fl | ||
| "\uFB02" => "fl" | ||
| # ﬃ => ffi | ||
| "\uFB03" => "ffi" | ||
| # ﬄ => ffl | ||
| "\uFB04" => "ffl" | ||
| # ſt => st | ||
| "\uFB05" => "st" | ||
| # ﬆ => st | ||
| "\uFB06" => "st" | ||
| # Māori macrons. | ||
| # Ā => A | ||
| "\u0100" => "A" | ||
| # Ē => E | ||
| "\u0112" => "E" | ||
| # Ī => I | ||
| "\u012A" => "I" | ||
| # Ō => O | ||
| "\u014C" => "O" | ||
| # Ū => U | ||
| "\u016A" => "U" | ||
| # ā => a | ||
| "\u0101" => "a" | ||
| # ē => e | ||
| "\u0113" => "e" | ||
| # ī => i | ||
| "\u012B" => "i" | ||
| # ō => o | ||
| "\u014D" => "o" | ||
| # ū => u | ||
| "\u016B" => "u" | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1 @@ | ||
|
|
||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
🧩 Analysis chain
Empty file — verify intent and populate if needed. The file is created as part of Estonian linguistic resources for Solr 9 language support but contains no content. Clarify whether this is:
Given that related linguistic files (
🏁 Script executed:
#!/bin/bash
# Diagnostic script: reports on the Estonian linguistic resource files of the
# Solr config-set and on where they are referenced. Every step is best-effort:
# missing files or missing tools produce a message instead of aborting.

# Directory holding the Solr config-set under inspection; spelled once here
# instead of being repeated in every command.
config_dir=".docker/config/solr/config-set"
nouns_file="$config_dir/nouns_et.txt"

# Check content and size of nouns_et.txt
echo "=== Checking nouns_et.txt ==="
if [[ -f "$nouns_file" ]]; then
  echo "File exists"
  echo "File size: $(wc -c < "$nouns_file") bytes"
  echo "Line count: $(wc -l < "$nouns_file") lines"
  echo "Content (hex dump):"
  od -c "$nouns_file" | head -5
else
  echo "File does not exist"
fi

# Check related Estonian language files
# printf is used for the section headers because `echo -e` is not portable.
printf '\n=== Checking related Estonian files ===\n'
for file in stopwords_et.txt synonyms_et.txt; do
  path="$config_dir/$file"
  if [[ -f "$path" ]]; then
    # "$path" is quoted inside the redirections so the target is never
    # word-split or glob-expanded.
    printf 'File: %s - Size: %s bytes, Lines: %s lines\n' \
      "$file" "$(wc -c < "$path")" "$(wc -l < "$path")"
    echo "First 3 lines:"
    head -3 "$path" || true
  else
    echo "$file: Not found"
  fi
done

# Search for references to nouns_et in configuration
printf '\n=== Searching for references to nouns_et ===\n'
rg -i "nouns_et" "$config_dir/" -A2 -B2 || echo "No references found"

# Check schema for Estonian language configuration
printf '\n=== Checking schema for Estonian references ===\n'
if [[ -f "$config_dir/managed-schema.xml" ]]; then
  # NOTE(review): the "et" alternative matches any occurrence of those two
  # letters (case-insensitively), so this search is intentionally broad.
  rg -i "et|estonia" "$config_dir/managed-schema.xml" -C2 || echo "No Estonian references found"
else
  # Fallback: scan at most five XML files. -E gives portable alternation
  # (the BRE form `\|` is a GNU extension).
  find "$config_dir/" -name "*.xml" | head -5 | xargs grep -iE "estonia|nouns" || true
fi

# List all files in the config-set directory to understand structure
printf '\n=== Files in config-set directory ===\n'
find .docker/config/solr/config-set/ -type f | sort
Length of output: 13810
Populate The file is currently empty (1 byte) but is actively referenced in Related Estonian files ( |
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1 @@ | ||
|
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Fix Unicode escape sequence syntax error on line 20.
Line 20 uses uppercase `\U0106`, but the correct syntax is lowercase `\u0106`. The uppercase variant is not valid for 4-digit hex escape sequences in most text processing contexts (including Solr's accent mapping configuration). This will cause a parsing error when Solr loads this configuration file.
Apply this diff to fix the error:
📝 Committable suggestion
🤖 Prompt for AI Agents