/*
 * testtextcat.c -- a simple commandline classifier. Feed it input on
 * standard in and it will feed you a classification on standard out.
 *
 * Copyright (C) 2003 WiseGuys Internet B.V.
 *
 * THE BSD LICENSE
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * - Redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the
 * distribution.
 *
 * - Neither the name of the WiseGuys Internet B.V. nor the names of
 * its contributors may be used to endorse or promote products derived
 * from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "config.h"

/* FILE, fread, feof, printf and fprintf are used directly below. */
#include <stdio.h>

/*
 * NOTE(review): the header names on the three guarded includes below were
 * missing from the text under review; they are reconstructed from the
 * HAVE_*_H guard names. Confirm against the upstream file.
 */
#ifdef HAVE_STDLIB_H
#include <stdlib.h>
#endif
#ifdef HAVE_STRINGS_H
#include <strings.h>
#endif
#ifdef HAVE_STRING_H
#include <string.h>
#endif

#include "textcat.h"
#include "common_impl.h"

/* Number of bytes requested from the stream per fread() call. */
#define BLOCKSIZE 4096

/* Only this many leading bytes of the input are handed to the classifier. */
#define MAXCLASSIFY 1024

/*
 * myread -- read everything remaining on `fp` into one heap buffer.
 *
 * The data is NUL-terminated, and the buffer is shrunk to fit before it is
 * returned. Reading stops at the first short read, i.e. at end-of-file or on
 * a read error; in the error case whatever was read so far is returned.
 *
 * Returns the buffer, which the caller releases with wg_free(), or NULL if
 * an allocation returned NULL.
 * NOTE(review): whether wg_malloc/wg_realloc can return NULL at all is not
 * visible from this file; the checks are harmless if they cannot.
 */
char *myread(FILE *fp)
{
    char *buf;
    size_t size = 0;
    size_t maxsize = BLOCKSIZE * 2;

    buf = (char *)wg_malloc(maxsize);
    if (buf == NULL) {
        return NULL;
    }

    /* Invariant at the top of each pass: size + BLOCKSIZE <= maxsize. */
    for (;;) {
        size_t hasread = fread(buf + size, 1, BLOCKSIZE, fp);
        size += hasread;

        /*
         * A short count means end-of-file or a read error on `fp`. The
         * previous code polled feof(stdin), which ignored `fp` and never
         * terminated when the stream reported an error instead of EOF.
         */
        if (hasread < BLOCKSIZE) {
            break;
        }

        if (size + BLOCKSIZE > maxsize) {
            char *grown;

            maxsize *= 2;
            grown = (char *)wg_realloc(buf, maxsize);
            if (grown == NULL) {
                wg_free(buf);
                return NULL;
            }
            buf = grown;
        }
    }

    /* The loop only exits after a short read, so size < maxsize here. */
    buf[size] = '\0';

    /* Shrink to fit; if that fails the larger buffer is still usable. */
    {
        char *fitted = (char *)wg_realloc(buf, size + 1);
        if (fitted != NULL) {
            buf = fitted;
        }
    }

    return buf;
}

/*
 * main -- classify the text arriving on standard input.
 *
 * argv[1], when given, is passed to textcat_Init(); otherwise "conf.txt" is
 * used. The version string and the classification result go to stdout, the
 * elapsed time goes to stderr. Exits with -1 when initialisation or reading
 * the input fails, and returns 0 otherwise.
 */
int main(int argc, char **argv)
{
    void *h;
    char *result;
    wgtimer_t tm;
    char *buf;
    size_t len;

    printf("%s\n", textcat_Version());

    h = textcat_Init(argc > 1 ? argv[1] : "conf.txt");
    if (!h) {
        printf("Unable to init. Aborting.\n");
        exit(-1);
    }

    buf = myread(stdin);
    if (buf == NULL) {
        printf("Unable to read input. Aborting.\n");
        textcat_Done(h);
        exit(-1);
    }

    wg_timerstart(&tm);

    /*** We only need a little text to determine the language ***/
    /*
     * Truncate only when the input really is longer than the limit: the
     * buffer from myread() holds just the input plus its terminator, so an
     * unconditional write at index MAXCLASSIFY would land outside it for
     * short inputs.
     */
    len = strlen(buf);
    if (len > MAXCLASSIFY) {
        buf[MAXCLASSIFY] = '\0';
        len = MAXCLASSIFY;
    }

    /* The size passed on includes the terminating NUL, as before. */
    result = textcat_Classify(h, buf, len + 1);
    printf("Result == %s\n", result);

    /* Cast so the argument matches %u whatever wg_timerstop() returns. */
    fprintf(stderr, "That took %u ms.\n",
            (unsigned int)(wg_timerstop(&tm) / 1000));

    textcat_Done(h);
    wg_free(buf);

    return 0;
}