ezra100 · January 21, 2023 23:03
diff --git a/A.steps.md b/A.steps.md
diff --git a/language_identifier_lib.cc b/language_identifier_lib.cc
 /* Copyright 2016 Google Inc. All Rights Reserved.

 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
 You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/

 #include <iostream>
 #include <map>
 #include <string>

 #include "base.h"
 #include "nnet_language_identifier.h"
 using chrome_lang_id::NNetLanguageIdentifier;

 using namespace std;
 // EXPORT marks a function as visible to users of the shared library.
 // MSVC builds use __declspec(dllexport); every other build (Linux included)
 // uses the GCC/Clang default-visibility attribute.
 #if defined(_MSC_VER) && !defined(__linux__)
 #define EXPORT __declspec(dllexport)
 #else
 #define EXPORT __attribute__((visibility("default")))
 #endif

 // Shared identifier instance used by every exported function in this file.
 // It starts out configured with a minimum of 0 and a maximum of 1000 bytes
 // and is swapped out by setMinMaxBytes().
 NNetLanguageIdentifier *lang_id = new NNetLanguageIdentifier(0, 1000);

 // Replaces the shared identifier with one configured for new byte limits.
 //
 // min: minimum number of bytes needed to make a prediction. If the default
 //      constructor is called, this variable is equal to
 //      kMinNumBytesToConsider.
 // max: maximum number of bytes to use to make a prediction. If the default
 //      constructor is called, this variable is equal to
 //      kMaxNumBytesToConsider.
 //
 // The replacement is constructed before the previous instance is destroyed,
 // so lang_id never points at freed memory if construction throws.
 EXPORT void setMinMaxBytes(int min, int max) {
     NNetLanguageIdentifier *previous = lang_id;
     lang_id = new NNetLanguageIdentifier(min, max);
     delete previous;
 }

 // Writes the predictions for @text into the caller-provided buffer @arr.
 //
 // @arr is assumed to be a pointer to an array with room for at least
 // @numberOfLangs elements. Nothing is written when @arr is null or
 // @numberOfLangs is not positive.
 EXPORT void findTopNMostFreqLangs(const string &text, int numberOfLangs,
                                   NNetLanguageIdentifier::Result *arr) {
     if (arr == nullptr || numberOfLangs <= 0) {
         return;
     }
     auto results = lang_id->FindTopNMostFreqLangs(text, numberOfLangs);
     // Clamp to the caller's capacity so a longer result list can never write
     // past the end of @arr.
     const auto capacity = static_cast<decltype(results.size())>(numberOfLangs);
     const auto count = results.size() < capacity ? results.size() : capacity;
     std::copy_n(results.begin(), count, arr);
 }

 // Returns a newly allocated array of @numberOfLangs results for @text.
 // Ownership passes to the caller, who must release it with delete[].
 EXPORT NNetLanguageIdentifier::Result *
 findTopNMostFreqLangs(const string &text, int numberOfLangs) {
     NNetLanguageIdentifier::Result *arr =
         new NNetLanguageIdentifier::Result[numberOfLangs];
     try {
         // The buffer-filling overload does the identification, so the
         // identifier runs exactly once per call.
         findTopNMostFreqLangs(text, numberOfLangs, arr);
     } catch (...) {
         delete[] arr; // do not leak the buffer if identification throws
         throw;
     }
     return arr;
 }

 // Runs the shared identifier's FindLanguage() on @text and hands its result
 // back to the caller by value.
 EXPORT NNetLanguageIdentifier::Result findLanguage(const string &text) {
     NNetLanguageIdentifier::Result detected = lang_id->FindLanguage(text);
     return detected;
 }
diff --git a/lIdentifier.hpp b/lIdentifier.hpp
 #include <string>
 #include <vector>
 #include <map>


 // Platform-dependent names used by the declarations below and by main.cpp.
 // IMPORT decorates functions imported from the library; WMAIN, WSTRING and
 // WCHAR name the entry point, string type and character type.
 #ifdef __linux__
 #define IMPORT
 #define WMAIN main
 // Was "#define string string", which redefined a standard-library name and
 // left WSTRING undefined on Linux.
 #define WSTRING string
 #define WCHAR char
 #else
 #define IMPORT __declspec(dllimport)
 #define WMAIN main
 #define WSTRING string
 #define WCHAR char
 #endif

 using namespace std;
 namespace chrome_lang_id {
 namespace NNetLanguageIdentifier {

 // One language prediction as exchanged with the identifier library.
 // NOTE(review): presumably this has to stay layout-compatible with the
 // library's own Result type — confirm before adding or reordering members.
 struct Result {
     // Language code; callers use it as the key into codeToLangName.
     std::string language;

     // Language probability.
     float probability = 0.0f;

     // Whether the prediction is reliable.
     bool is_reliable = false;

     // Proportion of bytes associated with the language. If FindLanguage
     // is called, this variable is set to 1.
     float proportion = 0.0f;
 };

 } // namespace NNetLanguageIdentifier
 } // namespace chrome_lang_id
 using namespace chrome_lang_id::NNetLanguageIdentifier;
 using namespace chrome_lang_id;

 // Reconfigures the library's identifier.
 //   min - minimum number of bytes needed to make a prediction. If the
 //         default constructor is called, this variable is equal to
 //         kMinNumBytesToConsider.
 //   max - maximum number of bytes to use to make a prediction. If the
 //         default constructor is called, this variable is equal to
 //         kMaxNumBytesToConsider.
 IMPORT void setMinMaxBytes(int min, int max);

 // Returns the library's single prediction for text.
 IMPORT NNetLanguageIdentifier::Result findLanguage(const std::string &text);

 // Fills the caller-supplied array (third argument) with the predictions for
 // text; the array is expected to hold numberOfLangs elements.
 IMPORT void findTopNMostFreqLangs(const std::string &text, int numberOfLangs,
                                   NNetLanguageIdentifier::Result *);

 // Same query, but the library allocates the array with new[]; the caller is
 // responsible for releasing it with delete[].
 IMPORT NNetLanguageIdentifier::Result *
 findTopNMostFreqLangs(const std::string &text, int numberOfLangs);


 // Lookup table from language code to a human-readable English name, plus
 // "und" for an undefined language.
 // NOTE(review): the codes look like ISO 639-1 — confirm they match every
 // code the identifier can return.
 //
 // Declared static so that each translation unit including this header gets
 // its own copy; a plain definition here would be a multiple-definition link
 // error as soon as a second source file includes the header.
 static std::map<std::string, std::string> codeToLangName{
     {"ab", "Abkhazian"},
     {"aa", "Afar"},
     {"af", "Afrikaans"},
     {"sq", "Albanian"},
     {"am", "Amharic"},
     {"ar", "Arabic"},
     {"an", "Aragonese"},
     {"hy", "Armenian"},
     {"as", "Assamese"},
     {"ae", "Avestan"},
     {"ay", "Aymara"},
     {"az", "Azerbaijani"},
     {"ba", "Bashkir"},
     {"eu", "Basque"},
     {"be", "Belarusian"},
     {"bn", "Bengali"},
     {"bh", "Bihari"},
     {"bi", "Bislama"},
     {"bs", "Bosnian"},
     {"br", "Breton"},
     {"bg", "Bulgarian"},
     {"my", "Burmese"},
     {"ca", "Catalan"},
     {"ch", "Chamorro"},
     {"ce", "Chechen"},
     {"zh", "Chinese"},
     {"cu", "Church Slavic; Slavonic; Old Bulgarian"},
     {"cv", "Chuvash"},
     {"kw", "Cornish"},
     {"co", "Corsican"},
     {"hr", "Croatian"},
     {"cs", "Czech"},
     {"da", "Danish"},
     {"dv", "Divehi; Dhivehi; Maldivian"},
     {"nl", "Dutch"},
     {"dz", "Dzongkha"},
     {"en", "English"},
     {"eo", "Esperanto"},
     {"et", "Estonian"},
     {"fo", "Faroese"},
     {"fj", "Fijian"},
     {"fi", "Finnish"},
     {"fr", "French"},
     {"gd", "Gaelic; Scottish Gaelic"},
     {"gl", "Galician"},
     {"ka", "Georgian"},
     {"de", "German"},
     {"el", "Greek, Modern (1453-)"},
     {"gn", "Guarani"},
     {"gu", "Gujarati"},
     {"ht", "Haitian; Haitian Creole"},
     {"ha", "Hausa"},
     {"he", "Hebrew"},
     {"hz", "Herero"},
     {"hi", "Hindi"},
     {"ho", "Hiri Motu"},
     {"hu", "Hungarian"},
     {"is", "Icelandic"},
     {"io", "Ido"},
     {"id", "Indonesian"},
     {"ia", "Interlingua (International Auxiliary Language Association)"},
     {"ie", "Interlingue"},
     {"iu", "Inuktitut"},
     {"ik", "Inupiaq"},
     {"ga", "Irish"},
     {"it", "Italian"},
     {"ja", "Japanese"},
     {"jv", "Javanese"},
     {"kl", "Kalaallisut"},
     {"kn", "Kannada"},
     {"ks", "Kashmiri"},
     {"kk", "Kazakh"},
     {"km", "Khmer"},
     {"ki", "Kikuyu; Gikuyu"},
     {"rw", "Kinyarwanda"},
     {"ky", "Kirghiz"},
     {"kv", "Komi"},
     {"ko", "Korean"},
     {"kj", "Kuanyama; Kwanyama"},
     {"ku", "Kurdish"},
     {"lo", "Lao"},
     {"la", "Latin"},
     {"lv", "Latvian"},
     {"li", "Limburgan; Limburger; Limburgish"},
     {"ln", "Lingala"},
     {"lt", "Lithuanian"},
     {"lb", "Luxembourgish; Letzeburgesch"},
     {"mk", "Macedonian"},
     {"mg", "Malagasy"},
     {"ms", "Malay"},
     {"ml", "Malayalam"},
     {"mt", "Maltese"},
     {"gv", "Manx"},
     {"mi", "Maori"},
     {"mr", "Marathi"},
     {"mh", "Marshallese"},
     {"mo", "Moldavian"},
     {"mn", "Mongolian"},
     {"na", "Nauru"},
     {"nv", "Navaho, Navajo"},
     {"nd", "Ndebele, North"},
     {"nr", "Ndebele, South"},
     {"ng", "Ndonga"},
     {"ne", "Nepali"},
     {"se", "Northern Sami"},
     {"no", "Norwegian"},
     {"nb", "Norwegian Bokmal"},
     {"nn", "Norwegian Nynorsk"},
     {"ny", "Nyanja; Chichewa; Chewa"},
     {"oc", "Occitan (post 1500); Provencal"},
     {"or", "Oriya"},
     {"om", "Oromo"},
     {"os", "Ossetian; Ossetic"},
     {"pi", "Pali"},
     {"pa", "Panjabi"},
     {"fa", "Persian"},
     {"pl", "Polish"},
     {"pt", "Portuguese"},
     {"ps", "Pushto"},
     {"qu", "Quechua"},
     {"rm", "Raeto-Romance"},
     {"ro", "Romanian"},
     {"rn", "Rundi"},
     {"ru", "Russian"},
     {"sm", "Samoan"},
     {"sg", "Sango"},
     {"sa", "Sanskrit"},
     {"sc", "Sardinian"},
     {"sr", "Serbian"},
     {"sn", "Shona"},
     {"ii", "Sichuan Yi"},
     {"sd", "Sindhi"},
     {"si", "Sinhala; Sinhalese"},
     {"sk", "Slovak"},
     {"sl", "Slovenian"},
     {"so", "Somali"},
     {"st", "Sotho, Southern"},
     {"es", "Spanish; Castilian"},
     {"su", "Sundanese"},
     {"sw", "Swahili"},
     {"ss", "Swati"},
     {"sv", "Swedish"},
     {"tl", "Tagalog"},
     {"ty", "Tahitian"},
     {"tg", "Tajik"},
     {"ta", "Tamil"},
     {"tt", "Tatar"},
     {"te", "Telugu"},
     {"th", "Thai"},
     {"bo", "Tibetan"},
     {"ti", "Tigrinya"},
     {"to", "Tonga (Tonga Islands)"},
     {"ts", "Tsonga"},
     {"tn", "Tswana"},
     {"tr", "Turkish"},
     {"tk", "Turkmen"},
     {"tw", "Twi"},
     {"ug", "Uighur"},
     {"uk", "Ukrainian"},
     {"ur", "Urdu"},
     {"uz", "Uzbek"},
     {"vi", "Vietnamese"},
     {"vo", "Volapuk"},
     {"wa", "Walloon"},
     {"cy", "Welsh"},
     {"fy", "Western Frisian"},
     {"wo", "Wolof"},
     {"xh", "Xhosa"},
     {"yi", "Yiddish"},
     {"yo", "Yoruba"},
     {"za", "Zhuang; Chuang"},
     {"zu", "Zulu"},
     {"und", "Undefined Language"}
 };

diff --git a/main.cpp b/main.cpp
 #pragma once
 #include "lIdentifier.hpp"
 #include <algorithm>
 #include <codecvt>
 #include <iostream>
 #include <locale>
 #include <map>
 #include <vector>

 // lIdentifier.hpp already defines WMAIN, WSTRING and WCHAR. Drop those
 // definitions first so that the differing values chosen below are not an
 // ill-formed macro redefinition.
 #undef WMAIN
 #undef WSTRING
 #undef WCHAR
 #ifdef __linux__
 #define WMAIN main
 #define WSTRING string
 #define WCHAR char
 #else
 #define WMAIN wmain
 #define WSTRING wstring
 #define WCHAR wchar_t
 #endif

 using namespace std;


 // Prints the predictions for text, numOfLangs of them; defined after main.
 void runTopFrequent(const string &text, int numOfLangs);

 // NOTE(review): startTime is never read or written in the visible code —
 // confirm whether it is still needed.
 clock_t startTime;

 // working with the already defined WMAIN WCHAR gave me errors
 #ifdef __linux__
 int main(int argc, char *argv[])
 #else
 int wmain(int argc, wchar_t *argv[])
 #endif
 {
    if (argc < 2) {
        std::cout << "usage: blah blach " << argv[0] << endl;
        return 0;
    }
 #ifdef __linux__
    std::string text(argv[1]);
 #else
    std::wstring wText(argv[1]);
    // see https://stackoverflow.com/a/18374698/4483033
    // use converter (.to_bytes: wstr->str, .from_bytes: str->wstr)
    std::string text =
        std::wstring_convert<std::codecvt_utf8<wchar_t>>().to_bytes(wText);
 #endif // __linux__
    if (argc < 3) {
        Result result = findLanguage(text);
        std::cout << "text: " << text << std::endl
                  << "  language: " << result.language << std::endl
                  << "  language name: " << codeToLangName[result.language]
                  << std::endl
                  << "  probability: " << result.probability << std::endl
                  << "  reliable: " << result.is_reliable << std::endl
                  << "  proportion: " << result.proportion << std::endl
                  << std::endl;
        return 0;
    }
    int numOfLangs = stoi(argv[2]);
    runTopFrequent(text, numOfLangs);
    return 0;
 }

 void runTopFrequent(const string &text, int numOfLangs) {
    Result *results = new Result[numOfLangs];
    findTopNMostFreqLangs(text, numOfLangs, results);
    for (int i = 0; i < numOfLangs; i++) {
        auto result = results[i];
        std::cout << "  language code: " << result.language << std::endl
                  << "  language name: " << codeToLangName[result.language]
                  << std::endl
                  << "  probability: " << result.probability << std::endl
                  << "  reliable: " << result.is_reliable << std::endl
                  << "  proportion: " << result.proportion << std::endl
                  << std::endl;
    }
    delete[] results;
 }
	/* Copyright 2016 Google Inc. All Rights Reserved.

	Licensed under the Apache License, Version 2.0 (the "License");
	you may not use this file except in compliance with the License.
	You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

	Unless required by applicable law or agreed to in writing, software
	distributed under the License is distributed on an "AS IS" BASIS,
	WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	See the License for the specific language governing permissions and
	limitations under the License.
	==============================================================================*/

	#include <iostream>
	#include <map>
	#include <string>

	#include "base.h"
	#include "nnet_language_identifier.h"
	using chrome_lang_id::NNetLanguageIdentifier;

	using namespace std;
	// EXPORT marks a function as visible to users of the shared library.
	// MSVC builds use __declspec(dllexport); every other build (Linux included)
	// uses the GCC/Clang default-visibility attribute.
	#if defined(_MSC_VER) && !defined(__linux__)
	#define EXPORT __declspec(dllexport)
	#else
	#define EXPORT __attribute__((visibility("default")))
	#endif

	// Shared identifier instance used by every exported function in this file.
	// It starts out configured with a minimum of 0 and a maximum of 1000 bytes
	// and is swapped out by setMinMaxBytes().
	NNetLanguageIdentifier *lang_id = new NNetLanguageIdentifier(0, 1000);

	// Replaces the shared identifier with one configured for new byte limits.
	//
	// min: minimum number of bytes needed to make a prediction. If the default
	//      constructor is called, this variable is equal to
	//      kMinNumBytesToConsider.
	// max: maximum number of bytes to use to make a prediction. If the default
	//      constructor is called, this variable is equal to
	//      kMaxNumBytesToConsider.
	//
	// The replacement is constructed before the previous instance is destroyed,
	// so lang_id never points at freed memory if construction throws.
	EXPORT void setMinMaxBytes(int min, int max) {
		NNetLanguageIdentifier *previous = lang_id;
		lang_id = new NNetLanguageIdentifier(min, max);
		delete previous;
	}

	// Writes the predictions for @text into the caller-provided buffer @arr.
	//
	// @arr is assumed to be a pointer to an array with room for at least
	// @numberOfLangs elements. Nothing is written when @arr is null or
	// @numberOfLangs is not positive.
	EXPORT void findTopNMostFreqLangs(const string &text, int numberOfLangs,
			NNetLanguageIdentifier::Result *arr) {
		if (arr == nullptr || numberOfLangs <= 0) {
			return;
		}
		auto results = lang_id->FindTopNMostFreqLangs(text, numberOfLangs);
		// Clamp to the caller's capacity so a longer result list can never
		// write past the end of @arr.
		const auto capacity = static_cast<decltype(results.size())>(numberOfLangs);
		const auto count = results.size() < capacity ? results.size() : capacity;
		std::copy_n(results.begin(), count, arr);
	}

	// Returns a newly allocated array of @numberOfLangs results for @text.
	// Ownership passes to the caller, who must release it with delete[].
	EXPORT NNetLanguageIdentifier::Result *
	findTopNMostFreqLangs(const string &text, int numberOfLangs) {
		NNetLanguageIdentifier::Result *arr =
			new NNetLanguageIdentifier::Result[numberOfLangs];
		try {
			// The buffer-filling overload does the identification, so the
			// identifier runs exactly once per call.
			findTopNMostFreqLangs(text, numberOfLangs, arr);
		} catch (...) {
			delete[] arr; // do not leak the buffer if identification throws
			throw;
		}
		return arr;
	}

	// Runs the shared identifier's FindLanguage() on @text and hands its result
	// back to the caller by value.
	EXPORT NNetLanguageIdentifier::Result findLanguage(const string &text) {
		NNetLanguageIdentifier::Result detected = lang_id->FindLanguage(text);
		return detected;
	}
	#include <string>
	#include <vector>
	#include <map>


	// Platform-dependent names used by the declarations below and by main.cpp.
	// IMPORT decorates functions imported from the library; WMAIN, WSTRING and
	// WCHAR name the entry point, string type and character type.
	#ifdef __linux__
	#define IMPORT
	#define WMAIN main
	// Was "#define string string", which redefined a standard-library name and
	// left WSTRING undefined on Linux.
	#define WSTRING string
	#define WCHAR char
	#else
	#define IMPORT __declspec(dllimport)
	#define WMAIN main
	#define WSTRING string
	#define WCHAR char
	#endif

	using namespace std;
	namespace chrome_lang_id {
	namespace NNetLanguageIdentifier {

	// One language prediction as exchanged with the identifier library.
	// NOTE(review): presumably this has to stay layout-compatible with the
	// library's own Result type — confirm before adding or reordering members.
	struct Result {
		// Language code; callers use it as the key into codeToLangName.
		std::string language;

		// Language probability.
		float probability = 0.0f;

		// Whether the prediction is reliable.
		bool is_reliable = false;

		// Proportion of bytes associated with the language. If FindLanguage
		// is called, this variable is set to 1.
		float proportion = 0.0f;
	};

	} // namespace NNetLanguageIdentifier
	} // namespace chrome_lang_id
	using namespace chrome_lang_id::NNetLanguageIdentifier;
	using namespace chrome_lang_id;

	// Reconfigures the library's identifier.
	//   min - minimum number of bytes needed to make a prediction. If the
	//         default constructor is called, this variable is equal to
	//         kMinNumBytesToConsider.
	//   max - maximum number of bytes to use to make a prediction. If the
	//         default constructor is called, this variable is equal to
	//         kMaxNumBytesToConsider.
	IMPORT void setMinMaxBytes(int min, int max);

	// Returns the library's single prediction for text.
	IMPORT NNetLanguageIdentifier::Result findLanguage(const std::string &text);

	// Fills the caller-supplied array (third argument) with the predictions for
	// text; the array is expected to hold numberOfLangs elements.
	IMPORT void findTopNMostFreqLangs(const std::string &text, int numberOfLangs,
			NNetLanguageIdentifier::Result *);

	// Same query, but the library allocates the array with new[]; the caller is
	// responsible for releasing it with delete[].
	IMPORT NNetLanguageIdentifier::Result *
	findTopNMostFreqLangs(const std::string &text, int numberOfLangs);


	// Lookup table from language code to a human-readable English name, plus
	// "und" for an undefined language.
	// NOTE(review): the codes look like ISO 639-1 — confirm they match every
	// code the identifier can return.
	//
	// Declared static so that each translation unit including this header gets
	// its own copy; a plain definition here would be a multiple-definition link
	// error as soon as a second source file includes the header.
	static std::map<std::string, std::string> codeToLangName{
		{"ab", "Abkhazian"},
		{"aa", "Afar"},
		{"af", "Afrikaans"},
		{"sq", "Albanian"},
		{"am", "Amharic"},
		{"ar", "Arabic"},
		{"an", "Aragonese"},
		{"hy", "Armenian"},
		{"as", "Assamese"},
		{"ae", "Avestan"},
		{"ay", "Aymara"},
		{"az", "Azerbaijani"},
		{"ba", "Bashkir"},
		{"eu", "Basque"},
		{"be", "Belarusian"},
		{"bn", "Bengali"},
		{"bh", "Bihari"},
		{"bi", "Bislama"},
		{"bs", "Bosnian"},
		{"br", "Breton"},
		{"bg", "Bulgarian"},
		{"my", "Burmese"},
		{"ca", "Catalan"},
		{"ch", "Chamorro"},
		{"ce", "Chechen"},
		{"zh", "Chinese"},
		{"cu", "Church Slavic; Slavonic; Old Bulgarian"},
		{"cv", "Chuvash"},
		{"kw", "Cornish"},
		{"co", "Corsican"},
		{"hr", "Croatian"},
		{"cs", "Czech"},
		{"da", "Danish"},
		{"dv", "Divehi; Dhivehi; Maldivian"},
		{"nl", "Dutch"},
		{"dz", "Dzongkha"},
		{"en", "English"},
		{"eo", "Esperanto"},
		{"et", "Estonian"},
		{"fo", "Faroese"},
		{"fj", "Fijian"},
		{"fi", "Finnish"},
		{"fr", "French"},
		{"gd", "Gaelic; Scottish Gaelic"},
		{"gl", "Galician"},
		{"ka", "Georgian"},
		{"de", "German"},
		{"el", "Greek, Modern (1453-)"},
		{"gn", "Guarani"},
		{"gu", "Gujarati"},
		{"ht", "Haitian; Haitian Creole"},
		{"ha", "Hausa"},
		{"he", "Hebrew"},
		{"hz", "Herero"},
		{"hi", "Hindi"},
		{"ho", "Hiri Motu"},
		{"hu", "Hungarian"},
		{"is", "Icelandic"},
		{"io", "Ido"},
		{"id", "Indonesian"},
		{"ia", "Interlingua (International Auxiliary Language Association)"},
		{"ie", "Interlingue"},
		{"iu", "Inuktitut"},
		{"ik", "Inupiaq"},
		{"ga", "Irish"},
		{"it", "Italian"},
		{"ja", "Japanese"},
		{"jv", "Javanese"},
		{"kl", "Kalaallisut"},
		{"kn", "Kannada"},
		{"ks", "Kashmiri"},
		{"kk", "Kazakh"},
		{"km", "Khmer"},
		{"ki", "Kikuyu; Gikuyu"},
		{"rw", "Kinyarwanda"},
		{"ky", "Kirghiz"},
		{"kv", "Komi"},
		{"ko", "Korean"},
		{"kj", "Kuanyama; Kwanyama"},
		{"ku", "Kurdish"},
		{"lo", "Lao"},
		{"la", "Latin"},
		{"lv", "Latvian"},
		{"li", "Limburgan; Limburger; Limburgish"},
		{"ln", "Lingala"},
		{"lt", "Lithuanian"},
		{"lb", "Luxembourgish; Letzeburgesch"},
		{"mk", "Macedonian"},
		{"mg", "Malagasy"},
		{"ms", "Malay"},
		{"ml", "Malayalam"},
		{"mt", "Maltese"},
		{"gv", "Manx"},
		{"mi", "Maori"},
		{"mr", "Marathi"},
		{"mh", "Marshallese"},
		{"mo", "Moldavian"},
		{"mn", "Mongolian"},
		{"na", "Nauru"},
		{"nv", "Navaho, Navajo"},
		{"nd", "Ndebele, North"},
		{"nr", "Ndebele, South"},
		{"ng", "Ndonga"},
		{"ne", "Nepali"},
		{"se", "Northern Sami"},
		{"no", "Norwegian"},
		{"nb", "Norwegian Bokmal"},
		{"nn", "Norwegian Nynorsk"},
		{"ny", "Nyanja; Chichewa; Chewa"},
		{"oc", "Occitan (post 1500); Provencal"},
		{"or", "Oriya"},
		{"om", "Oromo"},
		{"os", "Ossetian; Ossetic"},
		{"pi", "Pali"},
		{"pa", "Panjabi"},
		{"fa", "Persian"},
		{"pl", "Polish"},
		{"pt", "Portuguese"},
		{"ps", "Pushto"},
		{"qu", "Quechua"},
		{"rm", "Raeto-Romance"},
		{"ro", "Romanian"},
		{"rn", "Rundi"},
		{"ru", "Russian"},
		{"sm", "Samoan"},
		{"sg", "Sango"},
		{"sa", "Sanskrit"},
		{"sc", "Sardinian"},
		{"sr", "Serbian"},
		{"sn", "Shona"},
		{"ii", "Sichuan Yi"},
		{"sd", "Sindhi"},
		{"si", "Sinhala; Sinhalese"},
		{"sk", "Slovak"},
		{"sl", "Slovenian"},
		{"so", "Somali"},
		{"st", "Sotho, Southern"},
		{"es", "Spanish; Castilian"},
		{"su", "Sundanese"},
		{"sw", "Swahili"},
		{"ss", "Swati"},
		{"sv", "Swedish"},
		{"tl", "Tagalog"},
		{"ty", "Tahitian"},
		{"tg", "Tajik"},
		{"ta", "Tamil"},
		{"tt", "Tatar"},
		{"te", "Telugu"},
		{"th", "Thai"},
		{"bo", "Tibetan"},
		{"ti", "Tigrinya"},
		{"to", "Tonga (Tonga Islands)"},
		{"ts", "Tsonga"},
		{"tn", "Tswana"},
		{"tr", "Turkish"},
		{"tk", "Turkmen"},
		{"tw", "Twi"},
		{"ug", "Uighur"},
		{"uk", "Ukrainian"},
		{"ur", "Urdu"},
		{"uz", "Uzbek"},
		{"vi", "Vietnamese"},
		{"vo", "Volapuk"},
		{"wa", "Walloon"},
		{"cy", "Welsh"},
		{"fy", "Western Frisian"},
		{"wo", "Wolof"},
		{"xh", "Xhosa"},
		{"yi", "Yiddish"},
		{"yo", "Yoruba"},
		{"za", "Zhuang; Chuang"},
		{"zu", "Zulu"},
		{"und", "Undefined Language"}
	};
	#pragma once
	#include "lIdentifier.hpp"
	#include <algorithm>
	#include <codecvt>
	#include <iostream>
	#include <locale>
	#include <map>
	#include <vector>

	// lIdentifier.hpp already defines WMAIN, WSTRING and WCHAR. Drop those
	// definitions first so that the differing values chosen below are not an
	// ill-formed macro redefinition.
	#undef WMAIN
	#undef WSTRING
	#undef WCHAR
	#ifdef __linux__
	#define WMAIN main
	#define WSTRING string
	#define WCHAR char
	#else
	#define WMAIN wmain
	#define WSTRING wstring
	#define WCHAR wchar_t
	#endif

	using namespace std;


	// Prints the predictions for text, numOfLangs of them; defined after main.
	void runTopFrequent(const string &text, int numOfLangs);

	// NOTE(review): startTime is never read or written in the visible code —
	// confirm whether it is still needed.
	clock_t startTime;

	// working with the already defined WMAIN WCHAR gave me errors
	#ifdef __linux__
	int main(int argc, char *argv[])
	#else
	int wmain(int argc, wchar_t *argv[])
	#endif
	{
	if (argc < 2) {
	std::cout << "usage: blah blach " << argv[0] << endl;
	return 0;
	}
	#ifdef __linux__
	std::string text(argv[1]);
	#else
	std::wstring wText(argv[1]);
	// see https://stackoverflow.com/a/18374698/4483033
	// use converter (.to_bytes: wstr->str, .from_bytes: str->wstr)
	std::string text =
	std::wstring_convert<std::codecvt_utf8<wchar_t>>().to_bytes(wText);
	#endif // __linux__
	if (argc < 3) {
	Result result = findLanguage(text);
	std::cout << "text: " << text << std::endl
	<< " language: " << result.language << std::endl
	<< " language name: " << codeToLangName[result.language]
	<< std::endl
	<< " probability: " << result.probability << std::endl
	<< " reliable: " << result.is_reliable << std::endl
	<< " proportion: " << result.proportion << std::endl
	<< std::endl;
	return 0;
	}
	int numOfLangs = stoi(argv[2]);
	runTopFrequent(text, numOfLangs);
	return 0;
	}

	void runTopFrequent(const string &text, int numOfLangs) {
	Result *results = new Result[numOfLangs];
	findTopNMostFreqLangs(text, numOfLangs, results);
	for (int i = 0; i < numOfLangs; i++) {
	auto result = results[i];
	std::cout << " language code: " << result.language << std::endl
	<< " language name: " << codeToLangName[result.language]
	<< std::endl
	<< " probability: " << result.probability << std::endl
	<< " reliable: " << result.is_reliable << std::endl
	<< " proportion: " << result.proportion << std::endl
	<< std::endl;
	}
	delete[] results;
	}