97 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
			
		
		
	
	
			97 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
| #!/usr/bin/python3
 | |
| 
 | |
| # Copyright 2020 Google LLC
 | |
| #
 | |
| # Licensed under the Apache License, Version 2.0 (the "License");
 | |
| # you may not use this file except in compliance with the License.
 | |
| # You may obtain a copy of the License at
 | |
| #
 | |
| #      http://www.apache.org/licenses/LICENSE-2.0
 | |
| #
 | |
| # Unless required by applicable law or agreed to in writing, software
 | |
| # distributed under the License is distributed on an "AS IS" BASIS,
 | |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| # See the License for the specific language governing permissions and
 | |
| # limitations under the License.
 | |
| """ An example native JSON vs uJSON differential fuzzer.
 | |
| 
 | |
| This fuzzer looks for differences between the built-in json library and the
 | |
| native ujson library. The ujson library should be built for coverage (see
 | |
| build_install_ujson.sh), and the Python fuzzer should be executed under ASAN.
 | |
| As an example:
 | |
|     LD_PRELOAD="/usr/lib/llvm-9/lib/clang/9.0.1/lib/linux/libclang_rt.asan-x86_64.so
 | |
|     $(python3 -c "import atheris; print(atheris.path())")" python3
 | |
|     ./json_differential_fuzzer.py -detect_leaks=0
 | |
| 
 | |
| This fuzzer has found a bug with inconsistent handling of integers with
 | |
| too-high magnitude. uJSON sometimes refuses to process numbers that are too far
 | |
| from 0 with "Value is too big!" or the equivalent for values that are too
 | |
| negative. However, other times it happily processes them with two's complement
 | |
| mod. As an example, it refuses to parse "-9223372036854775809" (the first
 | |
| integer not representable in a 64-bit signed number) with "Value is too small";
 | |
| but it will happily parse "-80888888888888888888", a significantly more negative
 | |
| number. However, it parses it as -9223372036854775808. The JSON spec
 | |
| (https://tools.ietf.org/html/rfc7159#section-6) "allows implementations to set
 | |
| limits on the range and precision of numbers accepted", so failing to parse
 | |
| values that are too big or too small is technically fine; however,
 | |
| misinterpreting them is not.
 | |
| """
 | |
| 
 | |
| import atheris
 | |
| import sys
 | |
| 
 | |
| with atheris.instrument_imports():
 | |
|   import json
 | |
|   import ujson
 | |
| 
 | |
| 
 | |
| @atheris.instrument_func
 | |
def ClearAllIntegers(data):
  """Used to prevent known bug; sets all integers in data recursively to 0.

  Lists and dicts are updated in place, and nested lists/dicts are walked
  recursively. Any value that is not exactly an int, list or dict (for
  example str, float, None or bool) is returned unchanged.

  Args:
    data: A decoded JSON value.

  Returns:
    0 if data is an int; otherwise data itself, with every integer nested
    inside it replaced by 0.
  """
  # Exact type comparisons are deliberate: bool is a subclass of int, and an
  # isinstance() check would turn True/False into 0 as well.
  if type(data) is int:
    return 0
  if type(data) is list:
    for index, item in enumerate(data):
      data[index] = ClearAllIntegers(item)
  elif type(data) is dict:
    # Iterate over (key, value) pairs; iterating the dict directly yields only
    # keys. Rebinding an existing key does not resize the dict, so assigning
    # while iterating is safe.
    for key, value in data.items():
      data[key] = ClearAllIntegers(value)
  return data
 | |
| 
 | |
| 
 | |
| @atheris.instrument_func
 | |
def TestOneInput(input_bytes):
  """Decodes one fuzz input with both json and ujson and compares the results.

  The input bytes are turned into a unicode string, which is parsed by
  ujson.loads and json.loads. If either parser raises, the input is skipped.
  Otherwise both decoded values are re-encoded with json.dumps and the
  resulting strings are compared.

  Args:
    input_bytes: The raw bytes for this test case.

  Raises:
    RuntimeError: If the two re-encoded strings differ.
  """
  fdp = atheris.FuzzedDataProvider(input_bytes)
  original = fdp.ConsumeUnicode(sys.maxsize)

  try:
    ujson_data = ujson.loads(original)
    json_data = json.loads(original)
  except Exception:
    # It would be interesting to enforce that if one of the libraries throws an
    # exception, the other does too. However, uJSON accepts many invalid inputs
    # that are uninteresting, such as "00". So, that is not done.
    return

  # Uncomment these lines to ignore the errors described in the docstring of
  # this file.
  # json_data = ClearAllIntegers(json_data)
  # ujson_data = ClearAllIntegers(ujson_data)

  # Both values go through the same encoder (json.dumps), so any difference in
  # the output strings comes from the decoded data.
  json_dumped = json.dumps(json_data)
  ujson_dumped = json.dumps(ujson_data)

  if json_dumped != ujson_dumped:
    raise RuntimeError(
        "Decoding/encoding disagreement!\nInput: %s\nJSON data: %s\nuJSON data: %s\nJSON-dumped: %s\nuJSON-dumped: %s\n"
        % (original, json_data, ujson_data, json_dumped, ujson_dumped))
 | |
| 
 | |
| 
 | |
def main():
  """Passes sys.argv and TestOneInput to atheris.Setup, then calls atheris.Fuzz."""
  fuzzer_args = sys.argv
  atheris.Setup(fuzzer_args, TestOneInput)
  atheris.Fuzz()
 | |
| 
 | |
| 
 | |
# Run main() only when this file is executed as a script, not when imported.
if __name__ == "__main__":
  main()
 |