repo: init
This commit is contained in:
commit
0a431f0bd8
176
.gitignore
vendored
Normal file
176
.gitignore
vendored
Normal file
@ -0,0 +1,176 @@
|
||||
# Created by https://www.toptal.com/developers/gitignore/api/python
|
||||
# Edit at https://www.toptal.com/developers/gitignore?templates=python
|
||||
|
||||
### Python ###
|
||||
# Byte-compiled / optimized / DLL files
|
||||
__pycache__/
|
||||
*.py[cod]
|
||||
*$py.class
|
||||
|
||||
# C extensions
|
||||
*.so
|
||||
|
||||
# Distribution / packaging
|
||||
.Python
|
||||
build/
|
||||
develop-eggs/
|
||||
dist/
|
||||
downloads/
|
||||
eggs/
|
||||
.eggs/
|
||||
lib/
|
||||
lib64/
|
||||
parts/
|
||||
sdist/
|
||||
var/
|
||||
wheels/
|
||||
share/python-wheels/
|
||||
*.egg-info/
|
||||
.installed.cfg
|
||||
*.egg
|
||||
MANIFEST
|
||||
|
||||
# PyInstaller
|
||||
# Usually these files are written by a python script from a template
|
||||
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
||||
*.manifest
|
||||
*.spec
|
||||
|
||||
# Installer logs
|
||||
pip-log.txt
|
||||
pip-delete-this-directory.txt
|
||||
|
||||
# Unit test / coverage reports
|
||||
htmlcov/
|
||||
.tox/
|
||||
.nox/
|
||||
.coverage
|
||||
.coverage.*
|
||||
.cache
|
||||
nosetests.xml
|
||||
coverage.xml
|
||||
*.cover
|
||||
*.py,cover
|
||||
.hypothesis/
|
||||
.pytest_cache/
|
||||
cover/
|
||||
|
||||
# Translations
|
||||
*.mo
|
||||
*.pot
|
||||
|
||||
# Django stuff:
|
||||
*.log
|
||||
local_settings.py
|
||||
db.sqlite3
|
||||
db.sqlite3-journal
|
||||
|
||||
# Flask stuff:
|
||||
instance/
|
||||
.webassets-cache
|
||||
|
||||
# Scrapy stuff:
|
||||
.scrapy
|
||||
|
||||
# Sphinx documentation
|
||||
docs/_build/
|
||||
|
||||
# PyBuilder
|
||||
.pybuilder/
|
||||
target/
|
||||
|
||||
# Jupyter Notebook
|
||||
.ipynb_checkpoints
|
||||
|
||||
# IPython
|
||||
profile_default/
|
||||
ipython_config.py
|
||||
|
||||
# pyenv
|
||||
# For a library or package, you might want to ignore these files since the code is
|
||||
# intended to run in multiple environments; otherwise, check them in:
|
||||
# .python-version
|
||||
|
||||
# pipenv
|
||||
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
||||
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
||||
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
||||
# install all needed dependencies.
|
||||
#Pipfile.lock
|
||||
|
||||
# poetry
|
||||
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
|
||||
# This is especially recommended for binary packages to ensure reproducibility, and is more
|
||||
# commonly ignored for libraries.
|
||||
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
|
||||
#poetry.lock
|
||||
|
||||
# pdm
|
||||
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
|
||||
#pdm.lock
|
||||
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
|
||||
# in version control.
|
||||
# https://pdm.fming.dev/#use-with-ide
|
||||
.pdm.toml
|
||||
|
||||
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
|
||||
__pypackages__/
|
||||
|
||||
# Celery stuff
|
||||
celerybeat-schedule
|
||||
celerybeat.pid
|
||||
|
||||
# SageMath parsed files
|
||||
*.sage.py
|
||||
|
||||
# Environments
|
||||
.env
|
||||
.venv
|
||||
env/
|
||||
venv/
|
||||
ENV/
|
||||
env.bak/
|
||||
venv.bak/
|
||||
|
||||
# Spyder project settings
|
||||
.spyderproject
|
||||
.spyproject
|
||||
|
||||
# Rope project settings
|
||||
.ropeproject
|
||||
|
||||
# mkdocs documentation
|
||||
/site
|
||||
|
||||
# mypy
|
||||
.mypy_cache/
|
||||
.dmypy.json
|
||||
dmypy.json
|
||||
|
||||
# Pyre type checker
|
||||
.pyre/
|
||||
|
||||
# pytype static type analyzer
|
||||
.pytype/
|
||||
|
||||
# Cython debug symbols
|
||||
cython_debug/
|
||||
|
||||
# PyCharm
|
||||
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
|
||||
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
|
||||
# and can be added to the global gitignore or merged into this file. For a more nuclear
|
||||
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
|
||||
#.idea/
|
||||
|
||||
### Python Patch ###
|
||||
# Poetry local configuration file - https://python-poetry.org/docs/configuration/#local-configuration
|
||||
poetry.toml
|
||||
|
||||
# ruff
|
||||
.ruff_cache/
|
||||
|
||||
# LSP config files
|
||||
pyrightconfig.json
|
||||
|
||||
# End of https://www.toptal.com/developers/gitignore/api/python
|
21
LICENSE
Normal file
21
LICENSE
Normal file
@ -0,0 +1,21 @@
|
||||
MIT License
|
||||
|
||||
Copyright (c) 2024 tretrauit
|
||||
|
||||
Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||
of this software and associated documentation files (the "Software"), to deal
|
||||
in the Software without restriction, including without limitation the rights
|
||||
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||||
copies of the Software, and to permit persons to whom the Software is
|
||||
furnished to do so, subject to the following conditions:
|
||||
|
||||
The above copyright notice and this permission notice shall be included in all
|
||||
copies or substantial portions of the Software.
|
||||
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
||||
SOFTWARE.
|
20
README.md
Normal file
20
README.md
Normal file
@ -0,0 +1,20 @@
|
||||
# asjsonp
|
||||
|
||||
Another simple (and stupid) JSON parser.
|
||||
|
||||
## About
|
||||
|
||||
This is a parser for JSON (`.json`) as described in RFC 4627, supporting the standard features plus some extensions:
|
||||
|
||||
+ Comment support
|
||||
+ NaN, Infinity and -Infinity support (like the standard library)
|
||||
|
||||
## Usage
|
||||
|
||||
## Benchmark
|
||||
|
||||
This is about 10x slower than Python's built-in `json` module, so don't expect much performance from it.
|
||||
|
||||
## License
|
||||
|
||||
[MIT](./LICENSE)
|
4
asjsonp/__init__.py
Executable file
4
asjsonp/__init__.py
Executable file
@ -0,0 +1,4 @@
|
||||
from asjsonp.module import loads
|
||||
|
||||
|
||||
__all__ = ["loads"]
|
4
asjsonp/__main__.py
Executable file
4
asjsonp/__main__.py
Executable file
@ -0,0 +1,4 @@
|
||||
from asjsonp.module import loads
|
||||
|
||||
|
||||
# Demo entry point: parse ./test.json (relative to the working directory)
# and print the resulting Python object. The context manager closes the
# file deterministically instead of leaking the handle.
with open("test.json", "r", encoding="utf-8") as json_file:
    print(loads(json_file.read()))
|
125
asjsonp/module.py
Executable file
125
asjsonp/module.py
Executable file
@ -0,0 +1,125 @@
|
||||
__all__ = ["loads"]
|
||||
|
||||
|
||||
def js2py(obj: str):
|
||||
"""
|
||||
Convert a JSON string to a Python object.
|
||||
|
||||
This follows the simple approach defined in https://docs.python.org/3/library/json.html#encoders-and-decoders
|
||||
"""
|
||||
if obj == "true":
|
||||
return True
|
||||
elif obj == "false":
|
||||
return False
|
||||
elif obj == "null":
|
||||
return None
|
||||
elif obj == "NaN":
|
||||
return float("nan")
|
||||
elif obj == "Infinity":
|
||||
return float("inf")
|
||||
elif obj == "-Infinity":
|
||||
return float("-inf")
|
||||
elif obj.isnumeric():
|
||||
return int(obj)
|
||||
elif obj.lower().replace(".", "").replace("e", "").replace("-", "").isnumeric():
|
||||
return float(obj)
|
||||
else:
|
||||
raise ValueError(f"Invalid JSON value: {obj}")
|
||||
|
||||
|
||||
def loads(s: str):
    """
    Parse the JSON document ``s`` and return the equivalent Python object.

    Objects become ``dict``, arrays become ``list`` and strings become
    ``str`` with backslash escapes decoded (including ``\\uXXXX`` and
    UTF-16 surrogate pairs). Every other token (numbers, ``true``,
    ``false``, ``null``, ``NaN``, ``Infinity``, ``-Infinity``) is converted
    by :func:`js2py`.

    As an extension, ``//`` starts a comment that runs to the end of the
    line. Comment markers inside strings are ordinary text.

    :param s: The JSON text.
    :return: The Python object for the single top-level JSON value.
    :raises ValueError: If the text is empty, contains more than one
        top-level value, has unbalanced brackets, misplaced ``,`` / ``:``,
        an unterminated string, a bad escape or an invalid token.
    """
    simple_escapes = {
        '"': '"',
        "\\": "\\",
        "/": "/",
        "b": "\b",
        "f": "\f",
        "n": "\n",
        "r": "\r",
        "t": "\t",
    }
    hex_digits = frozenset("0123456789abcdefABCDEF")
    whitespace = " \t\n\r"
    # Characters that terminate a bare token such as a number or literal.
    token_end = frozenset(' \t\n\r,:[]{}"/')
    length = len(s)

    def error(message, at):
        """Build the exception for a problem found at index ``at``."""
        return ValueError(f"{message} at position {at}")

    def read_code_unit(at):
        """Return the integer value of the four hex digits starting at ``at``."""
        digits = s[at:at + 4]
        # int(..., 16) alone would also accept "0x1f" or "1_2f", so the
        # digits are validated explicitly first.
        if len(digits) != 4 or not hex_digits.issuperset(digits):
            raise error("Invalid \\u escape", at)
        return int(digits, 16)

    def read_string(start):
        """
        Decode the string whose opening quote is at ``start``.

        Returns ``(text, index just past the closing quote)``.
        """
        chunks = []
        i = start + 1
        while i < length:
            ch = s[i]
            if ch == '"':
                return "".join(chunks), i + 1
            if ch != "\\":
                chunks.append(ch)
                i += 1
                continue
            if i + 1 >= length:
                break  # backslash is the last character: unterminated
            code = s[i + 1]
            if code == "u":
                unit = read_code_unit(i + 2)
                i += 6
                # A high surrogate directly followed by a low surrogate
                # encodes one code point outside the BMP.
                if 0xD800 <= unit <= 0xDBFF and s.startswith("\\u", i):
                    low = read_code_unit(i + 2)
                    if 0xDC00 <= low <= 0xDFFF:
                        unit = 0x10000 + ((unit - 0xD800) << 10) + (low - 0xDC00)
                        i += 6
                chunks.append(chr(unit))
            elif code in simple_escapes:
                chunks.append(simple_escapes[code])
                i += 2
            else:
                raise error(f"Invalid escape '\\{code}'", i)
        raise error("Unterminated string", start)

    # The top-level value is collected in a holder list so it is attached
    # exactly like any nested value; the holder itself is never returned.
    root: list = []
    stack: list = []  # containers enclosing `current`, outermost first
    current: dict | list = root
    key = None  # pending object key; None (not "") means "no key yet"
    have_colon = False  # whether ':' has been seen after the pending key
    need_comma = False  # a value was just completed in `current`

    def attach(value, at):
        """Store ``value`` in the container currently being filled."""
        nonlocal key, have_colon, need_comma
        if isinstance(current, dict):
            if key is None:
                raise error("Object keys must be strings", at)
            if not have_colon:
                raise error("Expected ':' after object key", at)
            current[key] = value
            key = None
            have_colon = False
        else:
            current.append(value)
        need_comma = True

    i = 0
    while i < length:
        ch = s[i]
        if ch in whitespace:
            i += 1
        elif ch == "/":
            if not s.startswith("//", i):
                raise error("Unexpected '/'", i)
            newline = s.find("\n", i)
            i = length if newline == -1 else newline + 1
        elif ch == ",":
            # A comma is only valid inside a container, right after a value.
            if not stack or not need_comma:
                raise error("Unexpected ','", i)
            need_comma = False
            i += 1
        elif ch == ":":
            if key is None or have_colon:
                raise error("Unexpected ':'", i)
            have_colon = True
            i += 1
        elif ch in "]}":
            expected = "}" if isinstance(current, dict) else "]"
            if not stack or ch != expected:
                raise error(f"Unexpected '{ch}'", i)
            if key is not None:
                raise error("Object key without a value", i)
            if current and not need_comma:
                raise error("Trailing ','", i)
            # Return to the parent; the container just closed counts as a
            # completed value there.
            current = stack.pop()
            need_comma = True
            i += 1
        else:
            # Start of a key or of a value.
            if need_comma:
                raise error(
                    "Expected ','" if stack else "Extra data after the JSON value",
                    i,
                )
            if ch == '"':
                text, end = read_string(i)
                if isinstance(current, dict) and key is None:
                    key = text
                else:
                    attach(text, i)
                i = end
            elif ch in "[{":
                child: dict | list = {} if ch == "{" else []
                attach(child, i)
                stack.append(current)
                current = child
                need_comma = False
                i += 1
            else:
                end = i
                while end < length and s[end] not in token_end:
                    end += 1
                attach(js2py(s[i:end]), i)
                i = end

    if stack:
        raise error("Unclosed array or object", length)
    if not root:
        raise error("No JSON value found", length)
    return root[0]
|
33
benchmark/__main__.py
Normal file
33
benchmark/__main__.py
Normal file
@ -0,0 +1,33 @@
|
||||
import asjsonp
|
||||
import json
|
||||
import time
|
||||
import sys
|
||||
|
||||
|
||||
def test_asjsonp(text: str, count: int):
    """Time ``count`` calls of ``asjsonp.loads(text)`` and print the total in ms."""
    started_ns = time.perf_counter_ns()
    remaining = count
    while remaining > 0:
        asjsonp.loads(text)
        remaining -= 1
    elapsed_ns = time.perf_counter_ns() - started_ns
    # perf_counter_ns reports nanoseconds; 1000 ** 2 ns make one millisecond.
    elapsed_ms = elapsed_ns / (1000 ** 2)
    print(f"asjsonp.loads: {elapsed_ms}ms")
|
||||
|
||||
|
||||
def test_json(text: str, count: int):
    """Time ``count`` calls of the standard ``json.loads(text)`` and print the total in ms."""
    started_ns = time.perf_counter_ns()
    remaining = count
    while remaining > 0:
        json.loads(text)
        remaining -= 1
    elapsed_ns = time.perf_counter_ns() - started_ns
    # perf_counter_ns reports nanoseconds; 1000 ** 2 ns make one millisecond.
    elapsed_ms = elapsed_ns / (1000 ** 2)
    print(f"json.loads: {elapsed_ms}ms")
|
||||
|
||||
|
||||
# Benchmark driver. Defaults can be overridden on the command line with
# `-i <file>` (input JSON document) and `-c <count>` (iterations per parser).
input_file = "./benchmark/data/api.opensource.org.json"
count = 1000
options = sys.argv[1:]
for position, option in enumerate(options):
    if option not in ("-i", "-c"):
        continue
    # Without this check a trailing `-i` / `-c` died with a bare IndexError.
    if position + 1 >= len(options):
        sys.exit(f"Missing value for option {option}")
    value = options[position + 1]
    if option == "-i":
        input_file = value
    else:
        count = int(value)
# Read the document once up front so file I/O is not part of the timings;
# the context manager closes the handle instead of leaking it.
with open(input_file, "r", encoding="utf-8") as benchmark_file:
    text = benchmark_file.read()
print(f"Benchmarking file {input_file} with {count} iterations")
test_asjsonp(text, count)
test_json(text, count)
|
1
benchmark/data/api.opensource.org.json
Normal file
1
benchmark/data/api.opensource.org.json
Normal file
File diff suppressed because one or more lines are too long
15
pyproject.toml
Executable file
15
pyproject.toml
Executable file
@ -0,0 +1,15 @@
|
||||
[tool.poetry]
|
||||
name = "asjsonp"
|
||||
version = "0.1.0"
|
||||
description = "Another simple JSON parser"
|
||||
authors = ["tretrauit <tretrauit@gmail.com>"]
|
||||
license = "MIT"
|
||||
readme = "README.md"
|
||||
|
||||
[tool.poetry.dependencies]
|
||||
python = "^3.12"
|
||||
|
||||
|
||||
[build-system]
|
||||
requires = ["poetry-core"]
|
||||
build-backend = "poetry.core.masonry.api"
|
27
test.json
Executable file
27
test.json
Executable file
@ -0,0 +1,27 @@
|
||||
{
|
||||
"object": {
|
||||
"ubuntu": 16.04,
|
||||
"gcc": "10",
|
||||
"metadata": null,
|
||||
"another-object": {
|
||||
"oriented": "programming"
|
||||
},
|
||||
"a": "a",
|
||||
"array": [
|
||||
"sparkle",
|
||||
"hanabi",
|
||||
{
|
||||
"chipi": "chapa"
|
||||
},
|
||||
[[[[[[[[[["among us"]]]]]]]]]]
|
||||
]
|
||||
},
|
||||
"cc": "gcc",
|
||||
"glxgears": 123,
|
||||
"chai": "bon",
|
||||
"sparkle-sex": true,
|
||||
"nan": NaN,
|
||||
"-infinity": -Infinity,
|
||||
"infinity": Infinity,
|
||||
"e_number": 123e-123
|
||||
}
|
Loading…
Reference in New Issue
Block a user