{ "info": { "author": "Shahab Sabahi", "author_email": "sabahi.s@mysol-gc.jp", "bugtrack_url": null, "classifiers": [ "Intended Audience :: Developers", "Intended Audience :: Science/Research", "Programming Language :: Python", "Programming Language :: Python :: 3.7" ], "description": "*** Version-5 release with accuracy improvement *** \nThis program may take a minute or so to get results showed on the screen,\nplease be patient.\n\nSpoken Language Identification is the process of determining and classifying natural language \nfrom a given content and dataset. Employing an acoustic model and a language model, Data of \naudio files is processed to extract useful features for performing Machine Learning. \nThe acoustic features for SPOKEN LANGUAGE IDENTIFICATION are namely standard features such \nas Mel-Frequency Cepstral Coefficients (MFCC), Shifted Delta Cepstral (SDC), while for the \nlanguage features the Gaussian Mixture Model (GMM) and the i-vector based framework are \nused. \n\nHowever, the Machine Learning process based on extract features remains a challenge. \nOptimisation needs to be improved in order to capture embedded knowledge on the extracted \nfeatures. CNN (Convolutional Neural Networks), RNN (Recurrent Neural Networks) and ELM (the \nExtreme Learning Machine) are promising as effective learning architectures used to perform \nclassification and further complex analysis and are extremely useful to train a single \nhidden layer neural network. However, by now, the learning process of these models is not \nentirely effective due to the selection methods of weights within the input hidden layer.\n\nmyspokenlanguagedetection is a preliminary package structured for SPOKEN LANGUAGE \nIDENTIFICATION based on standard feature extraction\nand CNN and RNN. An optimisation approach was employed as the benchmark and improved by \naltering the selection phase of the optimisation process. The selection process is performed\nincorporating deferent methods. The results are generated based on SPOKEN LANGUAGE \nIDENTIFICATION with the datasets created from eighteen different languages. The results of \nthe study indicate the performance of Machine Learning highly correlated with the soundness \nof architecture of Neural Networks and co-existence of acoustic and language models.\n\nTHIS version of myspokenlanguagedetection was trained to detect \"French\", \"English\", \"Spanish\", \n\"Italian\", \"Deutsch\", \"Russian\", \"Portuguese\", \"Swedish\", and \"Japanese\" and to some lower \nextent other 40 languages. We will complete the machine training sessions for more languages \nalong with increasing the accuracy of the languages identification process.\n\n=============\nInstallation\n=============\nmyspokenlanguagedetection can be installed like any other Python library, using (a recent version of) the\nPython package manager pip, on Linux, macOS, and Windows:\n\n------------------pip install myspokenlanguagedetection\n\nor, to update your installed version to the latest release:\n------------------- pip install -u myspokenlanguagedetection \t---------------------------------\n\nRecording files must be 25 sec. or longer of audio and in *.wav PCM/LPCM format, recorded at 48 kHz \nsample frame and 24-32 bits of resolution or AIFF, AIFF-C, FLAC: must be native FLAC format; \nOGG-FLAC is not supported.\n\nplease check out https://github.com/Shahabks/myspokenlanguageid \n\nmyspokenlanguagedetection was developed by MYOLUTION Lab in Japan. It is part of New Generation of \nVoice Recognition and Acoustic & Language modeling Project in MYSOLUTION Lab. That is planned to \nenrich the functionality of myspokenlanguagedetection by adding more advanced functions.\n\n", "description_content_type": "", "docs_url": null, "download_url": "", "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "home_page": "https://github.com/Shahabks/myspokenlanguageid", "keywords": "speech signal processing,Natural Language Processing and Understanding", "license": "MIT", "maintainer": "", "maintainer_email": "", "name": "myspokenlanguagedetection", "package_url": "https://pypi.org/project/myspokenlanguagedetection/", "platform": "", "project_url": "https://pypi.org/project/myspokenlanguagedetection/", "project_urls": { "Homepage": "https://github.com/Shahabks/myspokenlanguageid" }, "release_url": "https://pypi.org/project/myspokenlanguagedetection/5/", "requires_dist": [ "numpy (>=1.15.2)", "SpeechRecognition (>=3.8.1)", "langdetect (>=1.0.7)", "pickleshare (>=0.7.5)", "nagisa (>=0.2.0)" ], "requires_python": "", "summary": "Spoken language identification with CNN and RNN - Improved Version: accuracy up", "version": "5" }, "last_serial": 4781069, "releases": { "3": [ { "comment_text": "", "digests": { "md5": "c9448836800aac314e8fbfcf1ef8a231", "sha256": "1bad53ff53ea33507799c397a9aefa8511a39919165faa149d062c3360f2a6ab" }, "downloads": -1, "filename": "myspokenlanguagedetection-3-py3-none-any.whl", "has_sig": false, "md5_digest": "c9448836800aac314e8fbfcf1ef8a231", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 27668, "upload_time": "2019-01-01T16:24:26", "url": "https://files.pythonhosted.org/packages/73/81/356044ae6043d44a730d3f097803603db5270d82013d522306d891eb4698/myspokenlanguagedetection-3-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "bee3ac3a5aea55721d8aa8955e9020fc", "sha256": "150e5ab5a95dc0b400094882f2f7a7686232aa4dabdec6a69ae7b3b5f44124b3" }, "downloads": -1, "filename": "myspokenlanguagedetection-3.tar.gz", "has_sig": false, "md5_digest": "bee3ac3a5aea55721d8aa8955e9020fc", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 3404, "upload_time": "2019-01-01T16:24:28", "url": "https://files.pythonhosted.org/packages/12/fc/55829afde34244715cec04e6132ac475d3488078f4db1c8e304f318709f4/myspokenlanguagedetection-3.tar.gz" } ], "4": [ { "comment_text": "", "digests": { "md5": "03c490183c0955eb0ffc28283ec35380", "sha256": "54dca14421f50f6138512fd8b865849365e302b86eab57d378d09cc3ffd4570f" }, "downloads": -1, "filename": "myspokenlanguagedetection-4-py3-none-any.whl", "has_sig": false, "md5_digest": "03c490183c0955eb0ffc28283ec35380", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 27713, "upload_time": "2019-01-02T15:45:04", "url": "https://files.pythonhosted.org/packages/22/55/b24bf9436577cd228d597141b0f4119d73059c4e5ff62e11d11f8da7392b/myspokenlanguagedetection-4-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "63fe7e775192d414f97f7b3de1d3e866", "sha256": "50d0f87565721975f7dd47688debf9b0a9e5a3e940db63291c3585055405fd62" }, "downloads": -1, "filename": "myspokenlanguagedetection-4.tar.gz", "has_sig": false, "md5_digest": "63fe7e775192d414f97f7b3de1d3e866", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 3467, "upload_time": "2019-01-02T15:45:05", "url": "https://files.pythonhosted.org/packages/d7/c3/a24de99190e1adaf6980fbf91e23d159f5eeb7b0b9a500a6bafa9640d89d/myspokenlanguagedetection-4.tar.gz" } ], "5": [ { "comment_text": "", "digests": { "md5": "a71d96b4ce9ca4299410a49bf789e605", "sha256": "daca655a6255aa28a6b58996fa7a273683a7d347b305cb792f22052a1a2dc908" }, "downloads": -1, "filename": "myspokenlanguagedetection-5-py3-none-any.whl", "has_sig": false, "md5_digest": "a71d96b4ce9ca4299410a49bf789e605", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 3970, "upload_time": "2019-02-05T08:25:30", "url": "https://files.pythonhosted.org/packages/73/0e/8c894989e6750f508ccc6d94783340ceec64c7b9fcf1070792ab5a9a0d07/myspokenlanguagedetection-5-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "b3501fa1aff7727a15d64fa00c9f1aa4", "sha256": "c7eb4a9faaf9606948bd3187181aa85caf9555dd26ba9484cad31c14995c35c6" }, "downloads": -1, "filename": "myspokenlanguagedetection-5.tar.gz", "has_sig": false, "md5_digest": "b3501fa1aff7727a15d64fa00c9f1aa4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 3696, "upload_time": "2019-02-05T08:25:31", "url": "https://files.pythonhosted.org/packages/71/b6/31426eff7a7bc02b0b990378ecbfd690ce9ab98af38220cc57f535f5ae7e/myspokenlanguagedetection-5.tar.gz" } ] }, "urls": [ { "comment_text": "", "digests": { "md5": "a71d96b4ce9ca4299410a49bf789e605", "sha256": "daca655a6255aa28a6b58996fa7a273683a7d347b305cb792f22052a1a2dc908" }, "downloads": -1, "filename": "myspokenlanguagedetection-5-py3-none-any.whl", "has_sig": false, "md5_digest": "a71d96b4ce9ca4299410a49bf789e605", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": null, "size": 3970, "upload_time": "2019-02-05T08:25:30", "url": "https://files.pythonhosted.org/packages/73/0e/8c894989e6750f508ccc6d94783340ceec64c7b9fcf1070792ab5a9a0d07/myspokenlanguagedetection-5-py3-none-any.whl" }, { "comment_text": "", "digests": { "md5": "b3501fa1aff7727a15d64fa00c9f1aa4", "sha256": "c7eb4a9faaf9606948bd3187181aa85caf9555dd26ba9484cad31c14995c35c6" }, "downloads": -1, "filename": "myspokenlanguagedetection-5.tar.gz", "has_sig": false, "md5_digest": "b3501fa1aff7727a15d64fa00c9f1aa4", "packagetype": "sdist", "python_version": "source", "requires_python": null, "size": 3696, "upload_time": "2019-02-05T08:25:31", "url": "https://files.pythonhosted.org/packages/71/b6/31426eff7a7bc02b0b990378ecbfd690ce9ab98af38220cc57f535f5ae7e/myspokenlanguagedetection-5.tar.gz" } ] }