<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Text Explorer - Need help with Topic Analysis in Discussions</title>
    <link>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50057#M28478</link>
    <description>&lt;P&gt;Looks like a good approach - if anyone out there knows a quantifiable way to choose "cut-off" points for relevance of each topic vector, that would be great.&lt;/P&gt;</description>
    <pubDate>Tue, 23 Jan 2018 18:20:30 GMT</pubDate>
    <dc:creator>ar2</dc:creator>
    <dc:date>2018-01-23T18:20:30Z</dc:date>
    <item>
      <title>Text Explorer - Need help with Topic Analysis</title>
      <link>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50019#M28464</link>
      <description>&lt;P&gt;Dear all - I am using Text Explorer to analyse some interesting "incident" data in a transport environment. I am using Topic Analysis and have identified about 15 sensible "topics". Is it possible to find out how many documents in my sample set "include" each topic? I haven't found a way to do that.&lt;/P&gt;&lt;P&gt;Any guidance welcome&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Tue, 23 Jan 2018 08:52:24 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50019#M28464</guid>
      <dc:creator>ar2</dc:creator>
      <dc:date>2018-01-23T08:52:24Z</dc:date>
    </item>
    <item>
      <title>Re: Text Explorer - Need help with Topic Analysis</title>
      <link>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50049#M28476</link>
      <description>&lt;P&gt;You should be able to use the document topic vectors.&amp;nbsp; Maybe someone knows of a quantifiable way to choose the decision points for each vector; I have done&amp;nbsp;that visually and by checking documents:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;&lt;CODE class=" language-jsl"&gt;Names default to here( 1 );

dt = Open( "$Sample_data/Aircraft Incidents.jmp" );

te = dt &amp;lt;&amp;lt; Text Explorer(
	Text Columns( :Final Narrative ),
	Latent Semantic Analysis(
		1,
		Maximum Number of Terms( 2128 ),
		Minimum Term Frequency( 10 ),
		Weighting( "TF IDF" ),
		Number of Singular Vectors( 100 ),
		Centering and Scaling( "Centered and Scaled" )
	),
	Topic Analysis( 1, Number of Topics( 10 ) ),
	Tokenizing( "Basic Words" ),
	Language( "English" ),
	SendToReport(
		Dispatch( {}, "Term and Phrase Lists", OutlineBox, {Close( 1 )} ),
		Dispatch( {}, "SVD Plots", OutlineBox, {Close( 1 )} ),
		Dispatch( {}, "Topic Terms", OutlineBox, {Close( 1 )} ),
		Dispatch( {}, "Topic Scores Plots", OutlineBox, {Close( 0 )} )
	)
);

//Save the topic vectors
te &amp;lt;&amp;lt; Save Document Topic Vectors;

//Decide what values relate to documents that contain the topic:
dt &amp;lt;&amp;lt; Distribution(
	Continuous Distribution( Column( :Topic 1 ) ),
	Continuous Distribution( Column( :Topic 2 ) ),
	Continuous Distribution( Column( :Topic 3 ) ),
	Continuous Distribution( Column( :Topic 4 ) ),
	Continuous Distribution( Column( :Topic 5 ) ),
	Continuous Distribution( Column( :Topic 6 ) ),
	Continuous Distribution( Column( :Topic 7 ) ),
	Continuous Distribution( Column( :Topic 8 ) ),
	Continuous Distribution( Column( :Topic 9 ) ),
	Continuous Distribution( Column( :Topic 10 ) )
);

//Select rows with topic 1
dt &amp;lt;&amp;lt; Select where( :Topic 1 &amp;gt; 5 );

//Or, count rows with topic 1:
Sum( (Column( dt, "Topic 1" ) &amp;lt;&amp;lt; Get values) &amp;gt; 5 );
//returns 169&lt;/CODE&gt;&lt;/PRE&gt;</description>
      <pubDate>Tue, 23 Jan 2018 17:15:50 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50049#M28476</guid>
      <dc:creator>ih</dc:creator>
      <dc:date>2018-01-23T17:15:50Z</dc:date>
    </item>
    <item>
      <title>Re: Text Explorer - Need help with Topic Analysis</title>
      <link>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50057#M28478</link>
      <description>&lt;P&gt;Looks like a good approach - if anyone out there knows a quantifiable way to choose "cut-off" points for relevance of each topic vector, that would be great.&lt;/P&gt;</description>
      <pubDate>Tue, 23 Jan 2018 18:20:30 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Text-Explorer-Need-help-with-Topic-Analysis/m-p/50057#M28478</guid>
      <dc:creator>ar2</dc:creator>
      <dc:date>2018-01-23T18:20:30Z</dc:date>
    </item>
  </channel>
</rss>

