Skip to content
This repository was archived by the owner on Apr 15, 2024. It is now read-only.
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
f478422
.gitignore
kakann Aug 30, 2022
d88aafd
added python action for automatic testing
kakann Aug 30, 2022
00b775a
changed unittest to unittest2
kakann Aug 30, 2022
de68dc9
removed extra flake8
kakann Aug 30, 2022
a53eb9b
created a requirements file
dakaza98 Aug 31, 2022
f9df9a0
migrate things to python 3
dakaza98 Aug 31, 2022
1d8140a
Merge pull request #1 from kakann/fix/python3-fixes
ghmo2789 Sep 1, 2022
fbee832
refactored some files
ghmo2789 Sep 2, 2022
d6f1a4e
moved tests for arfour, ascii85 and lzw
kakann Sep 2, 2022
495255f
Reformatet the files according to pep8
ghmo2789 Sep 3, 2022
c177f18
Add macOS created files in gitignore
ghmo2789 Sep 3, 2022
ee2a2e4
refactored the mapps
ghmo2789 Sep 6, 2022
f53a7f6
Fixed not module found error
ghmo2789 Sep 6, 2022
5f116cf
moved
amermsl92 Sep 6, 2022
32f926a
Autoformatteded half of all files
dakaza98 Sep 6, 2022
a55af9a
moved tests to tests folder Co-authored-by: Danel Arias <DanelArias-D…
dakaza98 Sep 6, 2022
c9a96b1
use argparse in pdf2txt Co-authored-by: Danel Arias <DanelArias-Dre…
dakaza98 Sep 6, 2022
2764d1e
formatted tools folder
dakaza98 Sep 6, 2022
4bb142b
can run test with make file
ghmo2789 Sep 7, 2022
f0a5e8d
Merge branch 'test_refactoring1' of https://github.com/kakann/pdfmine…
ghmo2789 Sep 7, 2022
3eac145
Formatting and fixing flake8 linting errors
DanelArias-Dreyton257 Sep 7, 2022
8e8b0a0
Add actions to all branches
DanelArias-Dreyton257 Sep 7, 2022
4444f10
Adding all branches to github actions
DanelArias-Dreyton257 Sep 7, 2022
7984161
added tests for pdf2txt
dakaza98 Sep 7, 2022
7b06f0e
Restoring the branches
DanelArias-Dreyton257 Sep 7, 2022
0487554
Restoring the branches
DanelArias-Dreyton257 Sep 7, 2022
f7fccc3
new_changes
amermsl92 Sep 7, 2022
8bdc488
Merge pull request #2 from kakann/fix/doubleD
ghmo2789 Sep 8, 2022
a3e7c7e
Merge with reformate_flak8 and solved conflic
ghmo2789 Sep 8, 2022
17e9a5e
Merge branch 'test_refactoring1' of https://github.com/kakann/pdfmine…
ghmo2789 Sep 8, 2022
1e4897d
Solved conflict
ghmo2789 Sep 8, 2022
07353ae
replaced getopt with argparser
ghmo2789 Sep 8, 2022
83529ab
Moved url function from pdf2html into separate module
ghmo2789 Sep 8, 2022
d5da2af
add_documentation
amermsl92 Sep 8, 2022
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 7 additions & 0 deletions .flake8
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
[flake8]
# Paths that flake8 must not lint, one pattern per line.
exclude =
    # Git metadata is never scanned
    .git,
    cmaprsrc/*,
    docs/*,
    venv/*
39 changes: 39 additions & 0 deletions .github/workflows/python-app.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
# This workflow installs the Python dependencies, lints with flake8 and runs
# the unit tests, all with a single version of Python.
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions

name: Python application

# Run on pushes to master and on pull requests that target master.
on:
  push:
    branches: ['master']
  pull_request:
    branches: ['master']

# The job only needs to read the repository contents.
permissions:
  contents: read

jobs:
  build:

    runs-on: ubuntu-latest

    steps:
    - uses: actions/checkout@v3
    - name: Set up Python 3.9
      uses: actions/setup-python@v3
      with:
        python-version: "3.9"
    - name: Install dependencies
      run: |
        python -m pip install --upgrade pip
        # unittest2 stays installed in case test modules still import it
        # (NOTE(review): drop it once nothing imports unittest2 any more).
        pip install flake8 unittest2
        if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
    - name: Lint with flake8
      run: |
        # Fail the build on any flake8 violation, using the repository's .flake8 settings.
        flake8 .
        # Report-only pass: exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
        flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
    - name: Test with unittest
      run: |
        # The unittest2 distribution installs a `unit2` script, not a `unittest2`
        # command, so invoke the standard-library runner on the test files
        # exactly as the Makefile `test` target does.
        python -m unittest tests/*.py
166 changes: 166 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,166 @@
# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
*$py.class

# C extensions
*.so

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
share/python-wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# PyInstaller
# Usually these files are written by a python script from a template
# before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.nox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
*.py,cover
.hypothesis/
.pytest_cache/
cover/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3
db.sqlite3-journal

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
.pybuilder/
target/

# Jupyter Notebook
.ipynb_checkpoints

# IPython
profile_default/
ipython_config.py

# pyenv
# For a library or package, you might want to ignore these files since the code is
# intended to run in multiple environments; otherwise, check them in:
# .python-version

# pipenv
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
# However, in case of collaboration, if having platform-specific dependencies or dependencies
# having no cross-platform support, pipenv may install dependencies that don't work, or not
# install all needed dependencies.
#Pipfile.lock

# poetry
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
# This is especially recommended for binary packages to ensure reproducibility, and is more
# commonly ignored for libraries.
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
#poetry.lock

# pdm
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
#pdm.lock
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
# in version control.
# https://pdm.fming.dev/#use-with-ide
.pdm.toml

# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
__pypackages__/

# Celery stuff
celerybeat-schedule
celerybeat.pid

# SageMath parsed files
*.sage.py

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# mkdocs documentation
/site

# mypy
.mypy_cache/
.dmypy.json
dmypy.json

# Pyre type checker
.pyre/

# pytype static type analyzer
.pytype/

# Cython debug symbols
cython_debug/

# PyCharm
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
# and can be added to the global gitignore or merged into this file. For a more nuclear
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
#.idea/

# Editor workspace settings directory (presumably Visual Studio Code)
.vscode/

# Files created by macOS
.DS_Store
# JetBrains IDE project folder, ignored in full (see the PyCharm note above)
.idea/
3 changes: 3 additions & 0 deletions .idea/.gitignore

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

22 changes: 13 additions & 9 deletions Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ TWINE=twine
# Command shorthands (presumably used by recipes elsewhere in this file).
RM=rm -f
CP=cp -f
MKDIR=mkdir
# Despite its name, this holds the complete test-runner command (python3
# running the unittest module); the `test` target appends the test files to it.
PYTHON3 = python3 -m unittest

all:

Expand Down Expand Up @@ -55,12 +56,15 @@ $(CMAPDST)/to-unicode-Adobe-Korea1.marshal.gz: $(CMAPDST)
$(CONV_CMAP) -c KSC-EUC=euc-kr -c KSC-Johab=johab -c KSCms-UHC=cp949 -c UniKS-UTF8=utf-8 \
$(CMAPDST) Adobe-Korea1 $(CMAPSRC)/cid2code_Adobe_Korea1.txt

# Self-test target: after `cmap` is up to date, run each listed pdfminer
# module as a script with $(PYTHON) -m, then run the `test` target of the
# Makefile in samples/.
test: cmap
$(PYTHON) -m pdfminer.arcfour
$(PYTHON) -m pdfminer.ascii85
$(PYTHON) -m pdfminer.lzw
$(PYTHON) -m pdfminer.rijndael
$(PYTHON) -m pdfminer.runlength
$(PYTHON) -m pdfminer.ccitt
$(PYTHON) -m pdfminer.psparser
# cd and the sub-make share one line because each recipe line runs in its own shell.
cd samples && $(MAKE) test
#test: cmap
# $(PYTHON) -m pdfminer.arcfour
# $(PYTHON) -m pdfminer.ascii85
# $(PYTHON) -m pdfminer.lzw
# $(PYTHON) -m pdfminer.rijndael
# $(PYTHON) -m pdfminer.runlength
# $(PYTHON) -m pdfminer.ccitt
# $(PYTHON) -m pdfminer.psparser
# cd samples && $(MAKE) test

# Run the unit tests: $(PYTHON3) expands to the unittest runner command and
# is handed every Python file under tests/.
# `test` names a command, not a file, so it is declared phony; otherwise a
# file or directory called `test` would make the target look up to date and
# the tests would silently not run.
.PHONY: test
test:
	$(PYTHON3) tests/*.py
Loading