<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: find events that contain non english words in Splunk Search</title>
    <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602666#M209776</link>
    <description>&lt;P&gt;&lt;a href="https://community.splunk.com/t5/user/viewprofilepage/user-id/217339"&gt;@indeed_2000&lt;/a&gt;&amp;nbsp;- The regex does work in the event that you provided.&lt;/P&gt;&lt;P&gt;&lt;A href="https://regex101.com/r/sG3IdX/1" target="_blank"&gt;https://regex101.com/r/sG3IdX/1&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="VatsalJagani_0-1655825720128.png" style="width: 574px;"&gt;&lt;img src="https://community.splunk.com/t5/image/serverpage/image-id/20212iAFB319ABFD2BDF17/image-dimensions/574x122?v=v2" width="574" height="122" role="button" title="VatsalJagani_0-1655825720128.png" alt="VatsalJagani_0-1655825720128.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Tue, 21 Jun 2022 15:35:41 GMT</pubDate>
    <dc:creator>VatsalJagani</dc:creator>
    <dc:date>2022-06-21T15:35:41Z</dc:date>
    <item>
      <title>How can I find events that contain non english words?</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/571048#M198987</link>
      <description>&lt;P&gt;Hi&lt;/P&gt;
&lt;P&gt;How can I find events that contain non-English words?&lt;/P&gt;
&lt;P&gt;E.g., I have a log file in which some lines contain German or Arabic words. How can I recognize these lines?&lt;/P&gt;
&lt;P&gt;thanks&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 15:44:40 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/571048#M198987</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-21T15:44:40Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602502#M209724</link>
      <description>&lt;P&gt;I can't help you too much for non-English words in ASCII character sets, but for languages with characters in the unicode set you could consider using Unicode Categories:&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.regular-expressions.info/unicode.html" target="_blank"&gt;https://www.regular-expressions.info/unicode.html&lt;/A&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;Quick example&lt;/STRONG&gt;:&lt;/P&gt;&lt;P&gt;| makeresults | eval text="كلب means dog according to google" | rex field=text "(?&amp;lt;capturetext&amp;gt;\p{Arabic}*)" | table text capturetext&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 03:35:30 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602502#M209724</guid>
      <dc:creator>DanielMustaine</dc:creator>
      <dc:date>2022-06-21T03:35:30Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602532#M209737</link>
      <description>&lt;P&gt;&lt;a href="https://community.splunk.com/t5/user/viewprofilepage/user-id/217339"&gt;@indeed_2000&lt;/a&gt;&amp;nbsp;- Try the&amp;nbsp;below search, it will find anything that contains anything other than desired character set.&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;&amp;lt;your base search&amp;gt;
| regex _raw="[^\x00-\x7F]"&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I hope this helps!!!&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 06:28:19 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602532#M209737</guid>
      <dc:creator>VatsalJagani</dc:creator>
      <dc:date>2022-06-21T06:28:19Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602658#M209771</link>
      <description>&lt;P&gt;&lt;a href="https://community.splunk.com/t5/user/viewprofilepage/user-id/247043"&gt;@DanielMustaine&lt;/a&gt;&amp;nbsp;not work on this&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P data-unlink="true"&gt;2022-06-20 11:16:10,381 INFO [APP] log in : 38773763@#123@دالكي&amp;nbsp;&lt;/P&gt;&lt;P&gt;any idea?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 14:58:29 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602658#M209771</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-21T14:58:29Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602661#M209773</link>
      <description>&lt;P&gt;&lt;a href="https://community.splunk.com/t5/user/viewprofilepage/user-id/93915"&gt;@VatsalJagani&lt;/a&gt;&amp;nbsp;not work!&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 15:03:40 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602661#M209773</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-21T15:03:40Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602666#M209776</link>
      <description>&lt;P&gt;&lt;a href="https://community.splunk.com/t5/user/viewprofilepage/user-id/217339"&gt;@indeed_2000&lt;/a&gt;&amp;nbsp;- The regex does work in the event that you provided.&lt;/P&gt;&lt;P&gt;&lt;A href="https://regex101.com/r/sG3IdX/1" target="_blank"&gt;https://regex101.com/r/sG3IdX/1&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="VatsalJagani_0-1655825720128.png" style="width: 574px;"&gt;&lt;img src="https://community.splunk.com/t5/image/serverpage/image-id/20212iAFB319ABFD2BDF17/image-dimensions/574x122?v=v2" width="574" height="122" role="button" title="VatsalJagani_0-1655825720128.png" alt="VatsalJagani_0-1655825720128.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 15:35:41 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602666#M209776</guid>
      <dc:creator>VatsalJagani</dc:creator>
      <dc:date>2022-06-21T15:35:41Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602672#M209778</link>
      <description>&lt;P&gt;It considers each character as separate; in this line I only have one non-English word!&lt;/P&gt;&lt;P&gt;Expected output:&lt;/P&gt;&lt;P&gt;| table NonEnglish&amp;nbsp;&lt;/P&gt;&lt;P&gt;دالكي&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Any idea?&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2022 16:01:01 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602672#M209778</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-21T16:01:01Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602896#M209838</link>
      <description>&lt;P&gt;Hey, try this:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;| makeresults | eval text="2022-06-20 11:16:10,381 INFO [APP] log in : 38773763@#123@دالكي " |rex field=text "(?&amp;lt;capturetext&amp;gt;[\p{Arabic}]+)" | table text capturetext&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Alternatively using&amp;nbsp;VatsalJagani's Regex (which will match all non-ASCII characters so get you the Russian sets etc.) like:&lt;/P&gt;&lt;P&gt;| makeresults | eval text="2022-06-20 11:16:10,381 INFO [APP] log in : 38773763@#123@دالكي " |rex field=text "(?&amp;lt;capturetext&amp;gt;[^\x00-\x7F]+)" | table text capturetext&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;If you know which field the non-standard characters will be in make sure to sub that fieldname into field=xxx. Otherwise, and it will perform poorly, but you can look over the whole log with field=_raw.&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jun 2022 00:47:25 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602896#M209838</guid>
      <dc:creator>DanielMustaine</dc:creator>
      <dc:date>2022-06-23T00:47:25Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602910#M209841</link>
      <description>&lt;P&gt;It still does not work as expected: if more than one non-English word exists on a line, I expect all of them to be captured.&lt;/P&gt;&lt;P&gt;e.g.&lt;/P&gt;&lt;P&gt;Expected result for the line below:&amp;nbsp;دالكي&amp;nbsp;&amp;nbsp;هلت&amp;nbsp;&lt;/P&gt;&lt;P data-unlink="true"&gt;"2022-06-20 11:16:10,381 INFO [APP] log in : 38773763@#123@دالكي&amp;nbsp;&amp;nbsp;هلت "&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jun 2022 05:30:58 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/602910#M209841</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-23T05:30:58Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603101#M209888</link>
      <description>&lt;P&gt;Try this:&lt;/P&gt;&lt;P&gt;| rex max_match=0 field=text "(?&amp;lt;capturetext&amp;gt;\p{Arabic}[\p{Arabic}\s]+)"&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;This one I didn't have as much success with but not much time to play.&lt;/P&gt;&lt;P&gt;| rex field=text max_match=0 "(?&amp;lt;capturetext&amp;gt;[^\x00-\x7F][^\x00-\x7F\s]+)"&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Max match will also mean that multiple phrases in one log are pulled into capturetext as new multivalue field values.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 24 Jun 2022 03:30:41 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603101#M209888</guid>
      <dc:creator>DanielMustaine</dc:creator>
      <dc:date>2022-06-24T03:30:41Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603227#M209931</link>
      <description>&lt;P&gt;Is there any way to treat all the non-English characters in each line as one extraction?&lt;/P&gt;&lt;P data-unlink="true"&gt;2022-06-20 11:16:10,381 INFO [APP] log in : 38773763@#123@دالكي&amp;nbsp;&amp;nbsp;string تست&lt;/P&gt;&lt;P data-unlink="true"&gt;&amp;nbsp;&lt;/P&gt;&lt;P data-unlink="true"&gt;Expected result:&lt;/P&gt;&lt;P data-unlink="true"&gt;تست&amp;nbsp;دالكي&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 25 Jun 2022 03:38:25 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603227#M209931</guid>
      <dc:creator>indeed_2000</dc:creator>
      <dc:date>2022-06-25T03:38:25Z</dc:date>
    </item>
    <item>
      <title>Re: find events that contain non english words</title>
      <link>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603253#M209940</link>
      <description>&lt;P&gt;Just remember that as it was stated before it has nothing to do with language as such. It will not capture, for example, a sentence "moja matka jada pomidory" ("my mother eats tomatoes" in Polish) even though it's clearly not an English sentence.&lt;/P&gt;</description>
      <pubDate>Sat, 25 Jun 2022 09:29:47 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Splunk-Search/How-can-I-find-events-that-contain-non-english-words/m-p/603253#M209940</guid>
      <dc:creator>PickleRick</dc:creator>
      <dc:date>2022-06-25T09:29:47Z</dc:date>
    </item>
  </channel>
</rss>

