@@ -93,40 +93,40 @@ jobs:
9393 brew install poppler tesseract
9494 uv pip install --upgrade pdftotext pytesseract
9595
96- - name : Install pdf2text and ocr dependencies (Windows w/latest Python)
97- # Do full install and testing of pdf2text and ocr only on latest Python version
98- if : ${{ matrix.python-version == '3.14' && runner.os == 'Windows' }}
99- shell : pwsh
100- run : |
101- # Set the preference variable to display Debug messages
102- $VerbosePreference = "Continue"
103-
104- # Install Poppler
105- # 1. install miniconda per https://conda.io/projects/conda/en/stable/user-guide/install/windows.html
106- $condaInstallerUrl = "https://repo.anaconda.com/miniconda/Miniconda3-latest-Windows-x86_64.exe"
107- $condaInstallerPath = "$env:TEMP\Miniconda3-setup.exe"
108- $installDir = "$env:TEMP\Miniconda3"
109- Invoke-WebRequest -Uri $condaInstallerUrl -OutFile $condaInstallerPath
110- # Run the installer silently
111- Start-Process -FilePath $condaInstallerPath -ArgumentList "/RegisterPython=0 /D=$installDir" -Wait -NoNewWindow
112- Remove-Item -Path $condaInstallerPath
113- # 2. install Poppler using conda
114- Start-Process -FilePath "$installDir\conda.exe" -ArgumentList "install -c conda-forge poppler --yes" -Wait -NoNewWindow
115-
116- # Install Tesseract
117- # See https://github.com/UB-Mannheim/tesseract/wiki
118- $tesseractInstallerUrl = "https://github.com/tesseract-ocr/tesseract/releases/download/5.5.0/tesseract-ocr-w64-setup-5.5.0.20241111.exe" # Replace with the latest version
119- $tesseractInstallerPath = "$env:TEMP\tesseract-ocr-setup.exe"
120- Invoke-WebRequest -Uri $tesseractInstallerUrl -OutFile $tesseractInstallerPath
121- # Run the installer silently
122- Start-Process -FilePath $tesseractInstallerPath -ArgumentList "/S /D=C:\Program Files\Tesseract-OCR" -Wait -NoNewWindow
123- Remove-Item -Path $tesseractInstallerPath
124- # Add Tesseract to PATH
125- $env:Path += ";C:\Program Files\Tesseract-OCR"
126- echo "C:\Program Files\Tesseract-OCR" | Out-File -FilePath $env:GITHUB_PATH -Append
127-
128- # Install Python packages
129- uv pip install --upgrade pdftotext pytesseract
96+ # - name: Install pdf2text and ocr dependencies (Windows w/latest Python)
97+ # # Do full install and testing of pdf2text and ocr only on latest Python version
98+ # if: ${{ matrix.python-version == '3.14' && runner.os == 'Windows' }}
99+ # shell: pwsh
100+ # run: |
101+ # # Set the preference variable to display Verbose messages
102+ # $VerbosePreference = "Continue"
103+
104+ # # Install Poppler
105+ # # 1. install miniconda per https://conda.io/projects/conda/en/stable/user-guide/install/windows.html
106+ # $condaInstallerUrl = "https://repo.anaconda.com/miniconda/Miniconda3-latest-Windows-x86_64.exe"
107+ # $condaInstallerPath = "$env:TEMP\Miniconda3-setup.exe"
108+ # $installDir = "$env:TEMP\Miniconda3"
109+ # Invoke-WebRequest -Uri $condaInstallerUrl -OutFile $condaInstallerPath -HttpVersion 2.0
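110+ # # Run the installer silently (NOTE(review): the Miniconda installer is only unattended when /S is passed, and /D must remain the last argument — the argument list below has no /S)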
111+ # Start-Process -FilePath $condaInstallerPath -ArgumentList "/RegisterPython=0 /D=$installDir" -Wait -NoNewWindow
112+ # Remove-Item -Path $condaInstallerPath
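113+ # # 2. install Poppler using conda (NOTE(review): Miniconda on Windows normally places conda.exe under "$installDir\Scripts" — confirm the path used below before re-enabling this step)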
114+ # Start-Process -FilePath "$installDir\conda.exe" -ArgumentList "install -c conda-forge poppler --yes" -Wait -NoNewWindow
115+
116+ # # Install Tesseract
117+ # # See https://github.com/UB-Mannheim/tesseract/wiki
118+ # $tesseractInstallerUrl = "https://github.com/tesseract-ocr/tesseract/releases/download/5.5.0/tesseract-ocr-w64-setup-5.5.0.20241111.exe" # Replace with the latest version
119+ # $tesseractInstallerPath = "$env:TEMP\tesseract-ocr-setup.exe"
120+ # Invoke-WebRequest -Uri $tesseractInstallerUrl -OutFile $tesseractInstallerPath -HttpVersion 2.0
121+ # # Run the installer silently
122+ # Start-Process -FilePath $tesseractInstallerPath -ArgumentList "/S /D=C:\Program Files\Tesseract-OCR" -Wait -NoNewWindow
123+ # Remove-Item -Path $tesseractInstallerPath
124+ # # Add Tesseract to PATH
125+ # $env:Path += ";C:\Program Files\Tesseract-OCR"
126+ # echo "C:\Program Files\Tesseract-OCR" | Out-File -FilePath $env:GITHUB_PATH -Append
127+
128+ # # Install Python packages
129+ # uv pip install --upgrade pdftotext pytesseract
130130
131131 - name : Install all other dependencies (GIL)
132132 if : ${{ ! endsWith(matrix.python-version, 't') }}
0 commit comments