Documentation update, compare against stdlib

ijl · Nov 23, 2024 · ded52a7
1 parent f53ec9f
commit ded52a7
Show file tree

Hide file tree

Showing 18 changed files with 119 additions and 474 deletions.
diff --git a/README.md b/README.md
diff --git a/bench/data.py b/bench/data.py
@@ -3,39 +3,17 @@
 from json import dumps as _json_dumps
 from json import loads as json_loads
 
-from rapidjson import dumps as _rapidjson_dumps
-from rapidjson import loads as rapidjson_loads
-from simplejson import dumps as _simplejson_dumps
-from simplejson import loads as simplejson_loads
-from ujson import dumps as _ujson_dumps
-from ujson import loads as ujson_loads
-
 from orjson import dumps as orjson_dumps
 from orjson import loads as orjson_loads
 
 
-def ujson_dumps(obj):
-    return _ujson_dumps(obj).encode("utf-8")
-
-
-def rapidjson_dumps(obj):
-    return _rapidjson_dumps(obj).encode("utf-8")
-
-
 def json_dumps(obj):
     return _json_dumps(obj).encode("utf-8")
 
 
-def simplejson_dumps(obj):
-    return _simplejson_dumps(obj).encode("utf-8")
-
-
 libraries = {
     "orjson": (orjson_dumps, orjson_loads),
-    "ujson": (ujson_dumps, ujson_loads),
     "json": (json_dumps, json_loads),
-    "rapidjson": (rapidjson_dumps, rapidjson_loads),
-    "simplejson": (simplejson_dumps, simplejson_loads),
 }
 
 

diff --git a/bench/requirements.txt b/bench/requirements.txt
@@ -1,9 +1,6 @@
-memory-profiler
+memory-profiler; python_version<"3.13"
 pandas; python_version<"3.13"
 pytest-benchmark
 pytest-random-order
-python-rapidjson
 seaborn; python_version<"3.13"
-simplejson
 tabulate
-ujson
diff --git a/bench/run_mem b/bench/run_mem
@@ -19,12 +19,6 @@ if lib_name == "json":
     from json import dumps, loads
 elif lib_name == "orjson":
     from orjson import dumps, loads
-elif lib_name == "rapidjson":
-    from rapidjson import dumps, loads
-elif lib_name == "simplejson":
-    from simplejson import dumps, loads
-elif lib_name == "ujson":
-    from ujson import dumps, loads
 else:
     raise NotImplementedError
 

diff --git a/doc/deserialization.png b/doc/deserialization.png
diff --git a/doc/serialization.png b/doc/serialization.png
diff --git a/integration/requirements.txt b/integration/requirements.txt
@@ -1,3 +1,3 @@
 flask;sys_platform!="win"
 gunicorn;sys_platform!="win"
-httpx==0.24.1;sys_platform!="win"
+httpx==0.27.2;sys_platform!="win"
diff --git a/pyproject.toml b/pyproject.toml
@@ -61,5 +61,5 @@ known-first-party = ["orjson"]
 python_version = "3.8"
 
 [[tool.mypy.overrides]]
-module = ["dateutil", "pytz", "simplejson", "ujson"]
+module = ["dateutil", "pytz"]
 ignore_missing_imports = true
diff --git a/requirements.txt b/requirements.txt
@@ -3,4 +3,4 @@
 -r test/requirements.txt
 maturin
 mypy==1.13.0
-ruff==0.7.1
+ruff==0.8.0
diff --git a/script/graph b/script/graph
@@ -13,7 +13,7 @@ from tabulate import tabulate
 
 import orjson
 
-LIBRARIES = ("orjson", "ujson", "rapidjson", "simplejson", "json")
+LIBRARIES = ("orjson", "json")
 
 
 def aggregate():

diff --git a/script/lint b/script/lint
@@ -2,7 +2,7 @@
 
 set -eou pipefail
 
-to_lint="./bench/*.py ./pysrc/orjson/__init__.pyi ./test/*.py script/pydataclass script/pymem
+to_lint="./bench/*.py ./pysrc/orjson/__init__.pyi ./test/*.py script/pydataclass
 script/pysort script/pynumpy script/pynonstr script/pycorrectness script/graph integration/init
 integration/wsgi.py integration/typestubs.py integration/thread"
 

diff --git a/script/pycorrectness b/script/pycorrectness
@@ -8,23 +8,17 @@ import lzma
 import os
 from pathlib import Path
 
-import rapidjson
-import simplejson
-import ujson
 from tabulate import tabulate
 
 import orjson
 
 dirname = os.path.join(os.path.dirname(__file__), "..", "data")
 
-LIBRARIES = ["orjson", "ujson", "rapidjson", "simplejson", "json"]
+LIBRARIES = ["orjson", "json"]
 
 
 LIBRARY_FUNC_MAP = {
     "orjson": orjson.loads,
-    "ujson": ujson.loads,
-    "rapidjson": rapidjson.loads,
-    "simplejson": simplejson.loads,
     "json": json.loads,
 }
 

diff --git a/script/pydataclass b/script/pydataclass
@@ -8,9 +8,6 @@ import os
 from timeit import timeit
 from typing import List
 
-import rapidjson
-import simplejson
-import ujson
 from tabulate import tabulate
 
 import orjson
@@ -50,7 +47,7 @@ def default(__obj):
 
 headers = ("Library", "dict (ms)", "dataclass (ms)", "vs. orjson")
 
-LIBRARIES = ("orjson", "ujson", "rapidjson", "simplejson", "json")
+LIBRARIES = ("orjson", "json")
 
 ITERATIONS = 100
 
@@ -72,34 +69,6 @@ for lib_name in LIBRARIES:
             lambda: json.dumps(objects_as_dataclass, default=default).encode("utf-8"),
             number=ITERATIONS,
         )
-    elif lib_name == "simplejson":
-        as_dict = timeit(
-            lambda: simplejson.dumps(objects_as_dict).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        as_dataclass = timeit(
-            lambda: simplejson.dumps(objects_as_dataclass, default=default).encode(
-                "utf-8"
-            ),
-            number=ITERATIONS,
-        )
-    elif lib_name == "ujson":
-        as_dict = timeit(
-            lambda: ujson.dumps(objects_as_dict).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        as_dataclass = None
-    elif lib_name == "rapidjson":
-        as_dict = timeit(
-            lambda: rapidjson.dumps(objects_as_dict).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        as_dataclass = timeit(
-            lambda: rapidjson.dumps(objects_as_dataclass, default=default).encode(
-                "utf-8"
-            ),
-            number=ITERATIONS,
-        )
     elif lib_name == "orjson":
         as_dict = timeit(lambda: orjson.dumps(objects_as_dict), number=ITERATIONS)
         as_dataclass = timeit(

diff --git a/script/pyindent b/script/pyindent
@@ -9,9 +9,6 @@ import sys
 from pathlib import Path
 from timeit import timeit
 
-import rapidjson
-import simplejson
-import ujson
 from tabulate import tabulate
 
 import orjson
@@ -37,7 +34,7 @@ data = read_fixture_obj(f"{filename}.json.xz")
 
 headers = ("Library", "compact (ms)", "pretty (ms)", "vs. orjson")
 
-LIBRARIES = ("orjson", "ujson", "rapidjson", "simplejson", "json")
+LIBRARIES = ("orjson", "json")
 
 output_in_kib_compact = len(orjson.dumps(data)) / 1024
 output_in_kib_pretty = len(orjson.dumps(data, option=orjson.OPT_INDENT_2)) / 1024
@@ -73,30 +70,6 @@ for lib_name in LIBRARIES:
             number=ITERATIONS,
         )
         correct = test_correctness(json.dumps(data, indent=2).encode("utf-8"))
-    elif lib_name == "simplejson":
-        time_compact = timeit(
-            lambda: simplejson.dumps(data).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_pretty = timeit(
-            lambda: simplejson.dumps(data, indent=2).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        correct = test_correctness(simplejson.dumps(data, indent=2).encode("utf-8"))
-    elif lib_name == "ujson":
-        time_compact = timeit(
-            lambda: ujson.dumps(data).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_pretty = timeit(
-            lambda: ujson.dumps(data, indent=2).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        correct = test_correctness(ujson.dumps(data, indent=2).encode("utf-8"))
-    elif lib_name == "rapidjson":
-        time_compact = timeit(lambda: rapidjson.dumps(data), number=ITERATIONS)
-        time_pretty = timeit(lambda: rapidjson.dumps(data, indent=2), number=ITERATIONS)
-        correct = test_correctness(rapidjson.dumps(data, indent=2))
     elif lib_name == "orjson":
         time_compact = timeit(lambda: orjson.dumps(data), number=ITERATIONS)
         time_pretty = timeit(

diff --git a/script/pymem b/script/pymem
diff --git a/script/pynonstr b/script/pynonstr
@@ -9,9 +9,6 @@ import random
 from time import mktime
 from timeit import timeit
 
-import rapidjson
-import simplejson
-import ujson
 from tabulate import tabulate
 
 import orjson
@@ -33,7 +30,7 @@ data_as_str = orjson.loads(orjson.dumps(data_as_obj, option=orjson.OPT_NON_STR_K
 
 headers = ("Library", "str keys (ms)", "int keys (ms)", "int keys sorted (ms)")
 
-LIBRARIES = ("orjson", "ujson", "rapidjson", "simplejson", "json")
+LIBRARIES = ("orjson", "json")
 
 ITERATIONS = 500
 
@@ -69,41 +66,6 @@ for lib_name in LIBRARIES:
             None  # TypeError: '<' not supported between instances of 'str' and 'int'
         )
         correct = False
-    elif lib_name == "simplejson":
-        time_as_str = timeit(
-            lambda: simplejson.dumps(data_as_str).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_as_obj = timeit(
-            lambda: simplejson.dumps(data_as_obj).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_as_obj_sorted = timeit(
-            lambda: simplejson.dumps(data_as_obj, sort_keys=True).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        correct = test_correctness(
-            simplejson.dumps(data_as_obj, sort_keys=True).encode("utf-8")
-        )
-    elif lib_name == "ujson":
-        time_as_str = timeit(
-            lambda: ujson.dumps(data_as_str).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_as_obj = timeit(
-            lambda: ujson.dumps(data_as_obj).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_as_obj_sorted = None  # segfault
-        correct = False
-    elif lib_name == "rapidjson":
-        time_as_str = timeit(
-            lambda: rapidjson.dumps(data_as_str).encode("utf-8"),
-            number=ITERATIONS,
-        )
-        time_as_obj = None
-        time_as_obj_sorted = None
-        correct = False
     elif lib_name == "orjson":
         time_as_str = timeit(
             lambda: orjson.dumps(data_as_str, None, orjson.OPT_NON_STR_KEYS),

diff --git a/script/pynumpy b/script/pynumpy
@@ -11,8 +11,6 @@ from timeit import timeit
 
 import numpy
 import psutil
-import rapidjson
-import simplejson
 from memory_profiler import memory_usage
 from tabulate import tabulate
 
@@ -71,7 +69,7 @@ def default(__obj):
 
 headers = ("Library", "Latency (ms)", "RSS diff (MiB)", "vs. orjson")
 
-LIBRARIES = ("orjson", "ujson", "rapidjson", "simplejson", "json")
+LIBRARIES = ("orjson", "json")
 
 ITERATIONS = 10
 
@@ -80,17 +78,6 @@ def orjson_dumps():
     return orjson.dumps(array, option=orjson.OPT_SERIALIZE_NUMPY)
 
 
-ujson_dumps = None
-
-
-def rapidjson_dumps():
-    return rapidjson.dumps(array, default=default).encode("utf-8")
-
-
-def simplejson_dumps():
-    return simplejson.dumps(array, default=default).encode("utf-8")
-
-
 def json_dumps():
     return json.dumps(array, default=default).encode("utf-8")