Skip to content

fix: remove duplicate characters caused by fake bold rendering in PDFs #396

fix: remove duplicate characters caused by fake bold rendering in PDFs

fix: remove duplicate characters caused by fake bold rendering in PDFs #396

Workflow file for this run

# Runs the Codeflash optimizer against pull requests that touch the
# `unstructured/` package, or on demand via manual dispatch.
name: Codeflash Optimization

on:
  pull_request:
    # Only trigger when files under the library package change.
    paths:
      - 'unstructured/**'
  workflow_dispatch:

# One active run per workflow + ref: a newer run for the same ref cancels
# the one still in progress.
concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}
  cancel-in-progress: true

jobs:
  optimize:
    name: Optimize new Python code
    # Skip runs whose actor is the Codeflash bot itself.
    # NOTE(review): presumably this prevents the bot's own pushes from
    # re-triggering the workflow in a loop - confirm.
    if: ${{ github.actor != 'codeflash-ai[bot]' }}
    runs-on: ubuntu-latest
    env:
      # Job-wide NLTK data location inside the checked-out workspace.
      NLTK_DATA: ${{ github.workspace }}/nltk_data
    steps:
      - uses: actions/checkout@v4
        with:
          # 0 = fetch full history rather than a shallow clone.
          # NOTE(review): presumably needed so the optimizer can diff
          # against the base branch - confirm.
          fetch-depth: 0

      - name: 🐍 Set up Python 3.12
        uses: actions/setup-python@v5
        with:
          # Quoted so YAML never reads the version as a float
          # (an unquoted 3.10 would become 3.1).
          python-version: "3.12"

      - name: 📦 Install Environment
        # Repository-local composite action (defined outside this file).
        uses: ./.github/actions/base-cache
        with:
          python-version: "3.12"

      - name: Install system dependencies
        # Installs apt packages, then adds the tesseract-ocr5 PPA and
        # installs tesseract with the Korean language package.
        run: |
          sudo apt-get update
          sudo apt-get install -y libmagic-dev poppler-utils libreoffice
          sudo add-apt-repository -y ppa:alex-p/tesseract-ocr5
          sudo apt-get update
          sudo apt-get install -y tesseract-ocr tesseract-ocr-kor

      - name: Codeflash Optimization
        env:
          # Both values come from repository secrets and are exposed only
          # to this step.
          UNS_API_KEY: ${{ secrets.UNS_API_KEY }}
          CODEFLASH_API_KEY: ${{ secrets.CODEFLASH_API_KEY }}
        run: uvx codeflash