Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 12 additions & 3 deletions .github/workflows/update_scribe_data.yml
Original file line number Diff line number Diff line change
Expand Up @@ -43,15 +43,15 @@ jobs:
# Check out the repository contents using the actions/checkout action (v4).
- name: Checkout repository
uses: actions/checkout@v4

# Select the Python interpreter for the job via actions/setup-python (v4).
# NOTE(review): this text is a rendered diff without +/- markers. The "3.11"
# and "3.12" lines look like the before/after versions of the same two keys;
# presumably only the 3.12 pair remains in the workflow - confirm.
# The version is quoted so YAML keeps it a string instead of parsing a float.
- name: Set up Python 3.11
- name: Set up Python 3.12
uses: actions/setup-python@v4
with:
python-version: "3.11"
python-version: "3.12"

# Refresh the apt package index, then install system packages with apt-get.
# NOTE(review): the two `apt-get install` lines look like the before/after
# versions of one command in a rendered diff; the second additionally installs
# libicu-dev, pkg-config, g++ and python3-dev - confirm which one is kept.
- name: Install system dependencies
run: |
sudo apt-get update
sudo apt-get install -y curl git sqlite3 make
sudo apt-get install -y curl git sqlite3 make libicu-dev pkg-config g++ python3-dev

# Set the execute bit on the data-update script.
- name: Make script executable
  run: |
    chmod +x ./update_data.sh
Expand All @@ -60,6 +60,15 @@ jobs:
id: run_script
run: ./update_data.sh true

# Sanity-check the generated English SQLite database: the file must exist,
# its tables are listed, and emoji_keywords must contain at least one row.
- name: Verify SQLite output
  run: |
    DB="./packs/sqlite/ENLanguageData.sqlite"
    # sqlite3 creates a missing database file instead of failing, so check
    # for the file explicitly to get a clear error message.
    if [ ! -f "$DB" ]; then
      echo "Error: $DB was not generated" >&2
      exit 1
    fi
    echo "Tables in $DB:"
    sqlite3 "$DB" ".tables"
    echo ""
    echo "Sample row from emoji_keywords:"
    sqlite3 "$DB" "SELECT * FROM emoji_keywords LIMIT 1;"
    # A SELECT on an empty table prints nothing and still exits 0, so the
    # row count is checked separately to make an empty table fail the step.
    ROW_COUNT=$(sqlite3 "$DB" "SELECT COUNT(*) FROM emoji_keywords;")
    if [ "$ROW_COUNT" -eq 0 ]; then
      echo "Error: emoji_keywords in $DB contains no rows" >&2
      exit 1
    fi

- name: Create deployment package
run: |
if [ ! -d "./packs/sqlite" ]; then
Expand Down
9 changes: 8 additions & 1 deletion update_data.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@ PROJECT_ROOT=$(pwd)

# Define target languages and data types.
# Both values are bash arrays of lowercase names.
# NOTE(review): DATA_TYPES is assigned twice here; this looks like the
# before/after pair of a rendered diff (the second adds "emoji_keywords").
# If both lines were executed as written, the second assignment would win.
TARGET_LANGUAGES=("english" "french" "german" "italian" "spanish" "portuguese" "russian" "swedish")
DATA_TYPES=("nouns" "verbs")
DATA_TYPES=("nouns" "verbs" "emoji_keywords")

# ANSI colour escape sequences (red and green foreground).
# Single quotes keep the backslash literal, so the consumer must interpret
# the escape (e.g. `echo -e` or `printf`) - presumably the logging helpers do.
RED='\033[0;31m'
GREEN='\033[0;32m'
Expand Down Expand Up @@ -130,6 +130,13 @@ pip install -e . || {
}
success "Dependencies installed successfully"

# Reinstall PyICU from its source distribution so that, per the log message
# below, it is compiled against the ICU installation on this machine.
log "🔧 Building PyICU from source against local ICU..."
# --no-binary is scoped to PyICU only: ":all:" would also forbid wheels for
# every other package pip has to install for this build.
# --no-cache-dir stops pip from reusing a wheel it built earlier, so the
# extension is actually compiled again.
pip install --force-reinstall --no-cache-dir --no-binary PyICU PyICU || {
    error "Failed to build PyICU from source"
    exit 1
}
success "PyICU built from source successfully"

# MARK: Download Wikidata Dump First

# Relative path stored in DUMP_DIR; presumably the directory that holds the
# Wikidata dump files - confirm against the code that uses it.
DUMP_DIR="./scribe_data_wikidata_dumps_export"
Expand Down