detect_handledata(3) Detecting character set and measuring accuracy of charset

SNOPSYS

#include <chardet.h>

short chardet_handledata (Detect ** handle, const char * inbuf, DetectObj ** outbuf);

DESCRIPTION

Storing charset and accuracy of inbuf to outbuf

handle

Detect handle resource that allocated by detect_init api.

inbuf

input string for detecting

outbuf

Stroing inforamtion of inbuf 46 The structure of outbuf is follows.

        typedef struct DetectObject {
                char * encoding;
                float confidence;
        } DetectObj;

The outbuf variable must be initialized by detect_obj_init API before calling this detect api.

RETURN VALUES

Returns following condition as case by case.

CHARDET_SUCCESS

Detecting success

CHARDET_NO_RESULT

Detection failure

CHARDET_NULL_OBJECT

Don't initializing outbuf with chardet_obj_init

CHARDET_OUT_OF_MEMORY

Occuring out of memory at internal API

EXAMPLE

#include <chardet.h>
int main (void) {
        Detect    * d;
        DetectObj * obj;
        int i, arrayNum;
        char *str[] = {
                "this is ascii",
                "이건 euc-kr 입니다."
        };
        arrayNum = sizeof (str) / sizeof (str[0]);
        if ( (d = detect_init ()) == NULL ) {
                fprintf (stderr, "chardet handle initialize failed\n");
                return CHARDET_MEM_ALLOCATED_FAIL;
        }
        for ( i=0; i<arrayNum; i++ ) {
                detect_reset (&d);
                if ( (obj = detect_obj_init ()) == NULL ) {
                        fprintf (stderr, "Memory Allocation failed\n");
                        return CHARDET_MEM_ALLOCATED_FAIL;
                }
                switch (detect_handledata (&d, "안녕하세요", &obj)) {
                        case CHARDET_OUT_OF_MEMORY :
                                fprintf (stderr, "On handle processing, occured out of memory\n");
                                detect_obj_free (&obj);
                                return CHARDET_OUT_OF_MEMORY;
                        case CHARDET_NULL_OBJECT :
                                fprintf (stderr,
                                                "2st argument of chardet() is must memory allocation "
                                                "with detect_obj_init API\n");
                                return CHARDET_NULL_OBJECT;
                }
                printf ("encoding: %s, confidence: %f\n", obj->encoding, obj->confidence);
                detect_obj_free (&obj);
        }
        detect_destroy (&d);
    return 0;
}

AUTHORS

JoungKyun.Kim <http://oops.org>

BUG REPORTS

Use QnA board on http://oops.org