src/bfile_heuristics.c

Wed, 31 May 2017 12:20:04 +0200

author
Mike Becker <universe@uap-core.de>
date
Wed, 31 May 2017 12:20:04 +0200
changeset 48
0d2c13c24fd0
parent 36
a7ff583e153f
child 57
68018eac46c3
permissions
-rw-r--r--

adds remaining autoconf files

universe@20 1 /*
universe@34 2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
universe@48 3 * Copyright 2017 Mike Becker. All rights reserved.
universe@34 4 *
universe@34 5 * Redistribution and use in source and binary forms, with or without
universe@34 6 * modification, are permitted provided that the following conditions are met:
universe@34 7 *
universe@34 8 * 1. Redistributions of source code must retain the above copyright
universe@34 9 * notice, this list of conditions and the following disclaimer.
universe@34 10 *
universe@34 11 * 2. Redistributions in binary form must reproduce the above copyright
universe@34 12 * notice, this list of conditions and the following disclaimer in the
universe@34 13 * documentation and/or other materials provided with the distribution.
universe@34 14 *
universe@34 15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
universe@34 16 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
universe@34 17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
universe@34 18 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
universe@34 19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
universe@34 20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
universe@34 21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
universe@34 22 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
universe@34 23 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
universe@34 24 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
universe@34 25 *
universe@20 26 * bfile_heuristics.c
universe@20 27 *
universe@20 28 * Created on: 20.10.2011
universe@20 29 * Author: Mike
universe@20 30 */
universe@20 31
universe@20 32 #include "bfile_heuristics.h"
universe@22 33 #include <ctype.h>
universe@20 34
universe@21 35 bfile_heuristics_t *new_bfile_heuristics_t() {
universe@21 36 bfile_heuristics_t *ret = malloc(sizeof(bfile_heuristics_t));
universe@21 37 ret->level = BFILE_MEDIUM_ACCURACY;
universe@22 38 bfile_reset(ret);
universe@21 39 return ret;
universe@20 40 }
universe@20 41
universe@21 42 void destroy_bfile_heuristics_t(bfile_heuristics_t *def) {
universe@21 43 free(def);
universe@20 44 }
universe@21 45
universe@22 46 void bfile_reset(bfile_heuristics_t *def) {
universe@22 47 def->bcount = 0;
universe@22 48 def->tcount = 0;
universe@22 49 }
universe@22 50
universe@21 51 bool bfile_check(bfile_heuristics_t *def, int next_char) {
universe@21 52 bool ret = false;
universe@22 53 if (def->level != BFILE_IGNORE) {
universe@22 54 def->tcount++;
universe@22 55 if (!isprint(next_char) && !isspace(next_char)) {
universe@22 56 def->bcount++;
universe@22 57 }
universe@22 58
universe@23 59 if (def->tcount > 1) { /* empty files are text files */
universe@23 60 switch (def->level) {
universe@23 61 case BFILE_LOW_ACCURACY:
universe@23 62 if (def->tcount > 15 || next_char == EOF) {
universe@23 63 ret = (1.0*def->bcount)/def->tcount > 0.32;
universe@23 64 }
universe@23 65 break;
universe@23 66 case BFILE_HIGH_ACCURACY:
universe@23 67 if (def->tcount > 500 || next_char == EOF) {
universe@23 68 ret = (1.0*def->bcount)/def->tcount > 0.1;
universe@23 69 }
universe@23 70 break;
universe@23 71 default: /* BFILE_MEDIUM_ACCURACY */
universe@23 72 if (def->tcount > 100 || next_char == EOF) {
universe@23 73 ret = (1.0*def->bcount)/def->tcount > 0.1;
universe@23 74 }
universe@23 75 break;
universe@22 76 }
universe@22 77 }
universe@22 78 }
universe@21 79
universe@21 80 return ret;
universe@21 81 }

mercurial