<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic How to recognize Chinese characters in a string？ in Discussions</title>
    <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654684#M84384</link>
    <description>&lt;P class=""&gt;&lt;SPAN class=""&gt;Hi, I have a problem with regex.&lt;/SPAN&gt;&lt;/P&gt;&lt;P class=""&gt;&lt;SPAN class=""&gt;For example:&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;regex("零件2305wu","[\u4e00-\u9fa5]+")&lt;/CODE&gt;&lt;/PRE&gt;&lt;P class=""&gt;I want to extract "零件", but the output is "2305".&lt;/P&gt;&lt;P class=""&gt;Thanks!&lt;/P&gt;</description>
    <pubDate>Mon, 03 Jul 2023 08:11:36 GMT</pubDate>
    <dc:creator>lehaofeng</dc:creator>
    <dc:date>2023-07-03T08:11:36Z</dc:date>
    <item>
      <title>How to recognize Chinese characters in a string？</title>
      <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654684#M84384</link>
      <description>&lt;P class=""&gt;&lt;SPAN class=""&gt;Hi, I have a problem with regex.&lt;/SPAN&gt;&lt;/P&gt;&lt;P class=""&gt;&lt;SPAN class=""&gt;For example:&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;regex("零件2305wu","[\u4e00-\u9fa5]+")&lt;/CODE&gt;&lt;/PRE&gt;&lt;P class=""&gt;I want to extract "零件", but the output is "2305".&lt;/P&gt;&lt;P class=""&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Mon, 03 Jul 2023 08:11:36 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654684#M84384</guid>
      <dc:creator>lehaofeng</dc:creator>
      <dc:date>2023-07-03T08:11:36Z</dc:date>
    </item>
    <item>
      <title>Re: How to recognize Chinese characters in a string？</title>
      <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654705#M84385</link>
      <description>&lt;P&gt;It seems to have been found.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;regex("零件2305wu","[^\x00-\xff]+")&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;&lt;/CODE&gt;&lt;/PRE&gt;</description>
      <pubDate>Mon, 03 Jul 2023 08:59:44 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654705#M84385</guid>
      <dc:creator>lehaofeng</dc:creator>
      <dc:date>2023-07-03T08:59:44Z</dc:date>
    </item>
    <item>
      <title>Re: How to recognize Chinese characters in a string？</title>
      <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654820#M84392</link>
      <description>&lt;P&gt;Nice! I was going to suggest something similar:&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;regex("零件2305wu","[^\x01-\x7f]+")&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;The characters from x00 to x7F are ASCII; x00 might make a note in the log, so maybe start at x01. Characters from x80 to xFF are similar to ASCII, and you might want to exclude them from the match as well (by extending the range to xFF). Everything outside that range is non-ASCII Unicode.&lt;/P&gt;
&lt;P&gt;The [ square brackets ] make a character set, and the leading ^ means &lt;EM&gt;not in this set&lt;/EM&gt;. The minus means a range. The + means one or more.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 03 Jul 2023 14:01:57 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/654820#M84392</guid>
      <dc:creator>Craige_Hales</dc:creator>
      <dc:date>2023-07-03T14:01:57Z</dc:date>
    </item>
    <item>
      <title>Re: How to recognize Chinese characters in a string？</title>
      <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/751898#M93316</link>
      <description>&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;tx=regex("零件2305wu","([一-﨩]{0,})");&lt;/CODE&gt;&lt;/PRE&gt;&lt;UL&gt;&lt;LI&gt;&lt;P class=""&gt;Is this possible, and is it reasonable?&lt;/P&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;Thanks, experts!&lt;/P&gt;</description>
      <pubDate>Fri, 03 May 2024 10:12:25 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/751898#M93316</guid>
      <dc:creator>lala</dc:creator>
      <dc:date>2024-05-03T10:12:25Z</dc:date>
    </item>
    <item>
      <title>Re: How to recognize Chinese characters in a string？</title>
      <link>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/751950#M93325</link>
      <description>&lt;P&gt;&lt;A href="https://www.google.com/search?q=unicode+%E4%B8%80" target="_self"&gt;https://www.google.com/search?q=unicode+%E4%B8%80&lt;/A&gt;&amp;nbsp; (4E00) is smaller than&lt;/P&gt;
&lt;P&gt;&lt;A href="https://www.google.com/search?q=unicode+%EF%A8%A9" target="_self"&gt;https://www.google.com/search?q=unicode+%EF%A8%A9&lt;/A&gt;&amp;nbsp; (FA29) so it should be a valid range. It covers about 11/16 of the 16-bit (Basic Multilingual Plane) Unicode code points, so it matches considerably more than just Chinese characters.&lt;/P&gt;
&lt;P&gt;{0,} means zero or more, just like *, so the pattern can also match an empty string; use + if at least one character is required.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;It appears to work, keeping the first two characters and rejecting the last six characters.&lt;/P&gt;</description>
      <pubDate>Fri, 03 May 2024 13:31:35 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/How-to-recognize-Chinese-characters-in-a-string/m-p/751950#M93325</guid>
      <dc:creator>Craige_Hales</dc:creator>
      <dc:date>2024-05-03T13:31:35Z</dc:date>
    </item>
  </channel>
</rss>

