161 lines
		
	
	
		
			3.8 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			161 lines
		
	
	
		
			3.8 KiB
		
	
	
	
		
			C
		
	
	
	
| /*
 | |
|  * Copyright 2021 Google LLC
 | |
|  *
 | |
|  * Licensed under the Apache License, Version 2.0 (the "License");
 | |
|  * you may not use this file except in compliance with the License.
 | |
|  * You may obtain a copy of the License at
 | |
|  *
 | |
|  *      http://www.apache.org/licenses/LICENSE-2.0
 | |
|  *
 | |
|  * Unless required by applicable law or agreed to in writing, software
 | |
|  * distributed under the License is distributed on an "AS IS" BASIS,
 | |
|  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
|  * See the License for the specific language governing permissions and
 | |
|  * limitations under the License.
 | |
|  */
 | |
| #include <sys/types.h>
 | |
| #include <stdlib.h>
 | |
| #include <stdio.h>
 | |
| #include <stdint.h>
 | |
| #include <unistd.h>
 | |
| #include "tidybuffio.h"
 | |
| #include "tidy.h"
 | |
| 
 | |
| // All boolean options. These will be set randomly
 | |
| // based on the fuzzer data.
 | |
| TidyOptionId bool_options[] = {
 | |
|   TidyJoinClasses, 
 | |
|   TidyJoinStyles, 
 | |
|   TidyKeepFileTimes, 
 | |
|   TidyKeepTabs, 
 | |
|   TidyLiteralAttribs, 
 | |
|   TidyLogicalEmphasis, 
 | |
|   TidyLowerLiterals, 
 | |
|   TidyMakeBare, 
 | |
|   TidyFixUri, 
 | |
|   TidyForceOutput, 
 | |
|   TidyGDocClean, 
 | |
|   TidyHideComments,
 | |
|   TidyMark, 
 | |
|   TidyXmlTags, 
 | |
|   TidyMakeClean,
 | |
|   TidyAnchorAsName, 
 | |
|   TidyMergeEmphasis, 
 | |
|   TidyMakeBare, 
 | |
|   TidyMetaCharset, 
 | |
|   TidyMuteShow, 
 | |
|   TidyNCR, 
 | |
|   TidyNumEntities, 
 | |
|   TidyOmitOptionalTags, 
 | |
|   TidyPunctWrap, 
 | |
|   TidyQuiet,
 | |
|   TidyQuoteAmpersand,  
 | |
|   TidyQuoteMarks, 
 | |
|   TidyQuoteNbsp, 
 | |
|   TidyReplaceColor, 
 | |
|   TidyShowFilename, 
 | |
|   TidyShowInfo, 
 | |
|   TidyShowMarkup, 
 | |
|   TidyShowMetaChange, 
 | |
|   TidyShowWarnings, 
 | |
|   TidySkipNested, 
 | |
|   TidyUpperCaseTags, 
 | |
|   TidyWarnPropAttrs, 
 | |
|   TidyWord2000, 
 | |
|   TidyWrapAsp, 
 | |
|   TidyWrapAttVals, 
 | |
|   TidyWrapJste, 
 | |
|   TidyWrapPhp, 
 | |
|   TidyWrapScriptlets, 
 | |
|   TidyWrapSection, 
 | |
|   TidyWriteBack,
 | |
| };
 | |
| 
 | |
| void set_option(const uint8_t** data, size_t *size, TidyDoc *tdoc, TidyOptionId tboolID) {
 | |
|   uint8_t decider;
 | |
|   decider = **data;
 | |
|   *data += 1; 
 | |
|   *size -= 1;
 | |
|   if (decider % 2 == 0) tidyOptSetBool( *tdoc, tboolID, yes );
 | |
|   else { tidyOptSetBool( *tdoc, tboolID, no ); }
 | |
| }
 | |
| 
 | |
| int TidyXhtml(const uint8_t* data, size_t size, TidyBuffer* output, TidyBuffer* errbuf) {
 | |
|   uint8_t decider;
 | |
| 
 | |
|   // We need enough data for picking all of the options. One byte per option.
 | |
|   if (size < 5+(sizeof(bool_options)/sizeof(bool_options[0]))) {
 | |
|     return 0;
 | |
|   }
 | |
| 
 | |
|   TidyDoc tdoc = tidyCreate();
 | |
| 
 | |
|   // Decide output format
 | |
|   decider = *data;
 | |
|   data++; size--;
 | |
|   if (decider % 3 == 0) tidyOptSetBool( tdoc, TidyXhtmlOut, yes );
 | |
|   else { tidyOptSetBool( tdoc, TidyXhtmlOut, no ); }
 | |
| 
 | |
|   if (decider % 3 == 1) tidyOptSetBool( tdoc, TidyHtmlOut, yes );
 | |
|   else { tidyOptSetBool( tdoc, TidyHtmlOut, no ); }
 | |
| 
 | |
|   if (decider % 3 == 2) tidyOptSetBool( tdoc, TidyXmlOut, yes );
 | |
|   else { tidyOptSetBool( tdoc, TidyXmlOut, no ); }
 | |
| 
 | |
|   // Set options 
 | |
|   for (int i=0; i < sizeof(bool_options)/sizeof(TidyOptionId); i++) {
 | |
|     set_option(&data, &size, &tdoc, bool_options[i]);
 | |
|   }
 | |
| 
 | |
|   // Set an error buffer.
 | |
|   tidySetErrorBuffer(tdoc, errbuf);
 | |
| 
 | |
|   // Parse the data
 | |
|   decider = *data;
 | |
|   data++; size--;
 | |
|   switch (decider % 2) {
 | |
|     case 0: {
 | |
|       char filename[256];
 | |
|       sprintf(filename, "/tmp/libfuzzer.%d", getpid());
 | |
| 
 | |
|       FILE *fp = fopen(filename, "wb");
 | |
|       if (!fp) {
 | |
|           return 0;
 | |
|       }
 | |
|       fwrite(data, size, 1, fp);
 | |
|       fclose(fp);
 | |
| 
 | |
|       tidyParseFile(tdoc, filename);
 | |
|       unlink(filename);
 | |
|     }
 | |
|     break;
 | |
|     case 1: {
 | |
|       char *inp = malloc(size+1);
 | |
|       inp[size] = '\0';
 | |
|       memcpy(inp, data, size);
 | |
|       tidyParseString(tdoc, inp);
 | |
|       free(inp);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Cleanup
 | |
|   tidyRelease( tdoc );
 | |
| 
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size) {
 | |
|   TidyBuffer fuzz_toutput;
 | |
|   TidyBuffer fuzz_terror;
 | |
| 
 | |
|   tidyBufInit(&fuzz_toutput);
 | |
|   tidyBufInit(&fuzz_terror);
 | |
| 
 | |
|   TidyXhtml(data, size, &fuzz_toutput, &fuzz_terror);
 | |
| 
 | |
|   tidyBufFree(&fuzz_toutput);
 | |
|   tidyBufFree(&fuzz_terror);
 | |
| 
 | |
|   return 0;
 | |
| }
 |