1 // Copyright (C) 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4  **********************************************************************
5  *   Copyright (C) 2005-2012, International Business Machines
6  *   Corporation and others.  All Rights Reserved.
7  **********************************************************************
8  */
9 
10 #ifndef __CSMATCH_H
11 #define __CSMATCH_H
12 
13 #include "unicode/uobject.h"
14 
15 #if !UCONFIG_NO_CONVERSION
16 
17 U_NAMESPACE_BEGIN
18 
19 class InputText;
20 class CharsetRecognizer;
21 
22 /*
23  * CharsetMatch represents the results produced by one Charset Recognizer for one input text
24  *              Any confidence > 0 indicates a possible match, meaning that the input bytes
25  *              are at least legal.
26  *
27  *              The full results of a detect are represented by an array of these
28  *              CharsetMatch objects, each representing a possible matching charset.
29  *
30  *              Note that a single charset recognizer may detect multiple closely related
31  *              charsets, and set different names depending on the exact input bytes seen.
32  */
33 class CharsetMatch : public UMemory
34 {
35  private:
36     InputText               *textIn;
37     int32_t                  confidence;
38     const char              *fCharsetName;
39     const char              *fLang;
40 
41  public:
42     CharsetMatch();
43 
44     /**
45       * fully set the state of this CharsetMatch.
46       * Called by the CharsetRecognizers to record match results.
47       * Default (NULL) parameters for names will be filled by calling the
48       *   corresponding getters on the recognizer.
49       */
50     void set(InputText               *input,
51              const CharsetRecognizer *cr,
52              int32_t                  conf,
53              const char              *csName=NULL,
54              const char              *lang=NULL);
55 
56     /**
57       * Return the name of the charset for this Match
58       */
59     const char *getName() const;
60 
61     const char *getLanguage()const;
62 
63     int32_t getConfidence()const;
64 
65     int32_t getUChars(UChar *buf, int32_t cap, UErrorCode *status) const;
66 };
67 
68 U_NAMESPACE_END
69 
70 #endif
71 #endif /* __CSMATCH_H */
72