Page tree

Versions Compared

Key

  • This line was added.
  • This line was removed.
  • Formatting was changed.

...

Code Block
language: xml
title: Example statistics XML file
<?xml version="1.0"?>
<statistics>
  <taskGuid>{792b3c27-0f48-4eaf-aaa3-dbdffd4da62b}</taskGuid>  	<!-- The unique GUID of the task -->
  <taskName>testpaketneu TRANSLATE-485</taskName>  				<!-- The textual name of the task -->
  <filtered>													<!-- The list of active filters; if no filter is set, the filtered tag is empty. Active filters influence all counters -->
    <filter>transitLockedForRefMat</filter>
  </filtered>
  <segmentCount>234</segmentCount>								<!-- The overall segment count of the task -->
  <segmentCountEditable>22</segmentCountEditable>				<!-- The number of segments that are editable in the task -->
  <import>														<!-- The import section contains the statistics taken directly after import -->
    <files>														<!-- The files section contains one file section for each file in the task -->
      <file>
        <fileName>MyNiceFile.ENG.transit</fileName>				
        <fileId>3539</fileId>
        <fields>
          <field>												<!-- One statistics block is created for each field; these are mainly source and target -->
            <fieldName>source</fieldName>
            <charFoundCount>1316</charFoundCount>				<!-- counts all chars in the segments of this file that contain at least one blue (found) term -->
            <charNotFoundCount>801</charNotFoundCount>			<!-- counts all chars in the segments of this file that contain at least one red (not found) term -->
            <wordFoundCount>195</wordFoundCount>				<!-- counts all words in the segments of this file that contain at least one blue (found) term -->
            <wordNotFoundCount>117</wordNotFoundCount>			<!-- counts all words in the segments of this file that contain at least one red (not found) term -->
            <termFoundCount>31</termFoundCount>					<!-- counts all blue (found) terms in this file -->
            <termNotFoundCount>11</termNotFoundCount>			<!-- counts all red (not found) terms in this file -->
																<!-- note: segments containing both red and blue terms are counted twice! -->
            <segmentsPerFile>117</segmentsPerFile>				<!-- counts all segments in this file -->
            <segmentsPerFileFound>24</segmentsPerFileFound>		<!-- counts all segments in this file that contain blue (found) terms -->
            <segmentsPerFileNotFound>11</segmentsPerFileNotFound>	<!-- counts all segments in this file that contain red (not found) terms -->
            <targetCharFoundCount>1301</targetCharFoundCount>   <!-- counts all chars in the target field of segments whose source contains blue (found) terms -->
            <targetCharNotFoundCount>839</targetCharNotFoundCount>	<!-- counts all chars in the target field of segments whose source contains red (not found) terms -->
            <targetSegmentsPerFileFound>24</targetSegmentsPerFileFound>	<!-- same value as segmentsPerFileFound -->
            <targetSegmentsPerFileNotFound>11</targetSegmentsPerFileNotFound>	<!-- same value as segmentsPerFileNotFound -->
          </field>
          <field>												<!-- same statistics as described above, only for the target field; in this example the target block carries no target* elements -->
            <fieldName>target</fieldName>
            <charFoundCount>2875</charFoundCount>
            <charNotFoundCount>0</charNotFoundCount>
            <wordFoundCount>478</wordFoundCount>
            <wordNotFoundCount>0</wordNotFoundCount>
            <termFoundCount>59</termFoundCount>
            <termNotFoundCount>0</termNotFoundCount>
            <segmentsPerFile>117</segmentsPerFile>
            <segmentsPerFileFound>45</segmentsPerFileFound>
            <segmentsPerFileNotFound>0</segmentsPerFileNotFound>
          </field>
        </fields>
      </file>
      <file>
		<!-- [...] here would be the next file -->
      </file>        
    </files>
    <fields>													<!-- The fields section contains the sums of the statistic values over all files -->
      <field>
        <fieldName>source</fieldName>
        <taskCharFoundCount>2632</taskCharFoundCount>
        <taskCharNotFoundCount>1602</taskCharNotFoundCount>
        <taskWordFoundCount>390</taskWordFoundCount>
        <taskWordNotFoundCount>234</taskWordNotFoundCount>
        <taskTermFoundCount>62</taskTermFoundCount>
        <taskTermNotFoundCount>22</taskTermNotFoundCount>
        <taskTargetCharFoundCount>2602</taskTargetCharFoundCount>
        <taskTargetCharNotFoundCount>1678</taskTargetCharNotFoundCount>
        <!-- NOTE(review): the two taskTargetWord* elements below have no per-file counterpart in this example; confirm against real plugin output -->
        <taskTargetWordFoundCount>430</taskTargetWordFoundCount>
        <taskTargetWordNotFoundCount>294</taskTargetWordNotFoundCount>
        <taskTargetSegmentsPerFileFound>48</taskTargetSegmentsPerFileFound>
        <taskTargetSegmentsPerFileNotFound>22</taskTargetSegmentsPerFileNotFound>
      </field>
      <field>
        <fieldName>target</fieldName>
        <taskCharFoundCount>5750</taskCharFoundCount>
        <taskCharNotFoundCount>0</taskCharNotFoundCount>
        <taskWordFoundCount>956</taskWordFoundCount>
        <taskWordNotFoundCount>0</taskWordNotFoundCount>
        <taskTermFoundCount>118</taskTermFoundCount>
        <taskTermNotFoundCount>0</taskTermNotFoundCount>
      </field>
    </fields>
  </import>
  <export>														<!-- The export section contains the statistics taken after an export was triggered -->
    <!-- [...] here would be the statistics at export -->
  </export>
</statistics>

Debugging

Adding the following line to your installation.ini enables debugging output for the SegmentStatistics plugin.

  runtimeOptions.debug.plugin.SegmentStatistics = 1

When debugging is enabled, the SegmentStatistics plugin:

  • creates the segmentstatistics-export files without a timestamp in the filename, which makes checking the file content easier.
  • returns the XML files formatted (with indentation)
  • additionally writes a CSV file with the XLS content
  • writes to the error log when writing the XLS file is finished