{"corpus_id":65045824,"paper_sha":"0a5a797b4affe10457dc61b062fba3a860d159f5","doi":"10.1016/J.PROCS.2017.10.024","arxiv_id":null,"pmid":null,"pmcid":null,"mag_id":2762491187,"dblp_id":"conf/iccsci/BarfianII17","acl_id":null,"title":"Twitter Pornography Multilingual Content Identification Based on Machine Learning","year":2017,"publication_date":null,"venue":"International Conference on Computer Science and Computational Intelligence","journal":{"name":null,"pages":"129-136","volume":null},"journal_issn":null,"journal_title":null,"publication_types":["JournalArticle"],"pubmed_pub_types":null,"s2_fields_of_study":["Linguistics","Computer Science"],"reference_count":7,"citation_count":10,"influential_citation_count":3,"is_open_access":false,"arxiv_categories":null,"arxiv_license":null,"arxiv_journal_ref":null,"mesh_headings":null,"chemicals":null,"comments_corrections":null,"source_flags":1,"s2_open_access_pdf_url":null,"s2_open_access_landing_url":null,"s2_open_access_license":null,"s2_open_access_status":null,"pmc_open_access_pdf_url":null,"pmc_open_access_landing_url":null,"pmc_open_access_license":null,"pmc_open_access_status":null,"unpaywall_open_access_pdf_url":null,"unpaywall_open_access_landing_url":null,"unpaywall_open_access_license":null,"unpaywall_open_access_status":null,"abstract":"Abstract Pornography on social media raises a lot of negative impact and affect the moral of children and teenagers. Social media used to spread pornography can have a negative impact. Thus, the spread of pornography on social media must be prevented. One of the social media which is often used as a medium pornography is Twitter. Pornography used on Twitter in the form of text and image. Among the two types of media, the text is very interesting to study because of the use of a variety of languages. In this study, the classification process will be conducted in Indonesian and English tweet and a combination of both languages. This classification uses three methods of machine learning, Decision Tree, Naive Bayes and Support Vector Machines for the purpose of comparing which method is the best in the classification process. In this study also conducted additional experiment was carried out with the aim of improving the performance in classification. The results showed that the level of accuracy is quite high. However, different grammar is a constraint that affects the accuracy of the results in the classification.","claims":[{"public_id":"cl_e0fa7d9c0d952f96918fd377575f4231","status":"active","text":"Additional experiments were carried out to improve classification performance.","confidence":0.9,"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/claims/cl_e0fa7d9c0d952f96918fd377575f4231"},{"public_id":"cl_7f37caa460735db0b34d338c4fa13e1c","status":"active","text":"Decision Tree, Naive Bayes, and Support Vector Machines were compared for multilingual pornography identification on Twitter using Indonesian, English, and combined-language tweets.","confidence":0.9,"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/claims/cl_7f37caa460735db0b34d338c4fa13e1c"},{"public_id":"cl_f15bc2599f0759e382ad4ec12a6ae304","status":"active","text":"High accuracy was achieved, but grammatical differences across languages negatively impacted accuracy.","confidence":0.85,"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/claims/cl_f15bc2599f0759e382ad4ec12a6ae304"}],"concepts":[{"public_id":"co_0035ad88e7959b8181576cf214275756","status":"active","name":"multilingual pornography identification","description":"The task of detecting pornographic content in tweets that may be in Indonesian, English, or a mix of both languages.","types":["task"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_0035ad88e7959b8181576cf214275756"},{"public_id":"co_02020407e8016635da124b5e3729ac8e","status":"active","name":"grammar constraint","description":"Grammatical differences across languages that limit the classification accuracy.","types":["limitation"],"aliases":["different grammar"],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_02020407e8016635da124b5e3729ac8e"},{"public_id":"co_0e53a10b0391002853deb826758937e6","status":"active","name":"Support Vector Machines","description":"A supervised learning model used for classification tasks in this study.","types":["method"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_0e53a10b0391002853deb826758937e6"},{"public_id":"co_25a185d53cb61b9cc402adaf62252f58","status":"active","name":"Indonesian tweet","description":"A tweet written primarily in the Indonesian language.","types":["data"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_25a185d53cb61b9cc402adaf62252f58"},{"public_id":"co_63ca78bdf46971efd1ddafc76ca99993","status":"active","name":"combined-language tweets","description":"Tweets that contain a mixture of Indonesian and English languages.","types":["data"],"aliases":["combination of both languages"],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_63ca78bdf46971efd1ddafc76ca99993"},{"public_id":"co_90248f6cdc8baf4ab1da3e3788e8b09d","status":"active","name":"Decision Tree","description":"A supervised machine learning method used for classification in this study.","types":["method"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_90248f6cdc8baf4ab1da3e3788e8b09d"},{"public_id":"co_a94bc9445c587ee4ab821e7e8985eb07","status":"active","name":"English tweet","description":"A tweet written primarily in the English language.","types":["data"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_a94bc9445c587ee4ab821e7e8985eb07"},{"public_id":"co_b1ed3dec53ce0b07ce9aa50154134dc2","status":"active","name":"accuracy","description":"The evaluation metric used to measure the correctness of classification predictions.","types":["metric"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_b1ed3dec53ce0b07ce9aa50154134dc2"},{"public_id":"co_cc2b8845d1af51a6ce096d15b53e4f8d","status":"active","name":"Naive Bayes","description":"A probabilistic machine learning classifier used for text classification in this study.","types":["method"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_cc2b8845d1af51a6ce096d15b53e4f8d"},{"public_id":"co_e51fdff9d5b2918961857f3443f23a25","status":"active","name":"additional experiment","description":"An extra experimental procedure conducted with the aim of improving classification performance.","types":["procedure"],"aliases":[],"contributors":[{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["extraction"],"url":"https://sah.borca.ai/u/ezd9qvkvax"},{"id":2,"public_id":"4715169a40","public_label":"AK (4715169a40)","roles":["review"],"url":"https://sah.borca.ai/u/4715169a40"},{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["review"],"url":"https://sah.borca.ai/u/322360f1c1"}],"url":"https://sah.borca.ai/concepts/co_e51fdff9d5b2918961857f3443f23a25"}],"external_ids":{"DOI":"10.1016/J.PROCS.2017.10.024","ArXiv":null,"PubMed":null,"PubMedCentral":null,"MAG":2762491187,"DBLP":"conf/iccsci/BarfianII17","ACL":null},"open_access":{"is_open_access":false,"pdf_url":null,"landing_url":"https://sah.borca.ai/papers/65045824","source":null,"pdf_url_source":null,"license":null,"reason":"pdf_url_not_indexed"},"reference_availability":{"status":"available","references_indexed":true,"full_text_available":false,"full_text_source":null,"count_basis":"semantic_scholar_metadata","extraction_status":"not_applicable","reason":null},"source":{"provider":"episteme2","base_corpus":"semantic_scholar_dump","freshness_mode":"unknown","basis":["semantic_scholar_metadata","postgres_metadata"],"limits":["paper metadata is based on indexed upstream scholarly datasets","claims and concepts are available only for extracted papers","absence of claims or concepts means no extracted graph data is available in this response"],"status":"available","degraded":false,"degraded_reasons":[],"diagnostics":{"status":"available","degraded":false,"degraded_reasons":[],"metadata_status":"available","graph_status":"available","abstract_status":"available"},"source_flags":1},"paper_id":631412,"paper_uid":"c383a9b4-6c26-407e-a434-4d2e26589670","canonical_identity":{"paper_id":631412,"paper_uid":"c383a9b4-6c26-407e-a434-4d2e26589670","identity_status":"available","lookup_basis":"semantic_scholar_external_id","compatibility_path":"corpus_id"},"url":"https://sah.borca.ai/papers/65045824"}