<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xml:lang="en" lang="en" xmlns="http://www.w3.org/1999/xhtml">
  <head runat="server">
    <!-- PageID 382 - published by RedDot 7.5 - 7.5.1.69 - 22111 -->
    <META name="PublicArticle" content="True" />
    <META http-equiv="Content-Type" content="text/html; charset=utf-8" />
    <META name="keywords" />
    <META name="summary" />
    <META name="product" content="apdata,apendpt,apendptdl" />
    <META name="version" content="v83" />
    <META name="book" content="Data Manager Help 8.3" />
    <title>Patterns &amp; Phrases</title>
    <!--Loading the 2016 fonts.-->
    <script type="text/javascript" src="//fast.fonts.net/jsapi/c504d579-e135-4f75-8335-4906f6c6ce67.js"></script>
    <!--Library content styles.-->
    <link rel="StyleSheet" href="https://help.forcepoint.com/docs/ni/assets/css/help2016.css" type="text/css" media="all" />
    <!--2016 font support -->
    <link type="text/css" rel="stylesheet" href="//fast.fonts.net/cssapi/c504d579-e135-4f75-8335-4906f6c6ce67.css" />
  </head>
  <body>
    <!--googleoff: all-->
    <a href="https://www.forcepoint.com">
      <img class="logo" alt="Forcepoint logo" src="https://help.forcepoint.com/docs/ni/assets/logo1.png" />
    </a>
    <div class="extLinksContainer">
      <a class="extLinks" href="http://help.forcepoint.com/docs/technical-library.aspx">Technical Library</a> | <a class="extLinks" href="https://help.forcepoint.com/content/support.aspx?intcmp=nav-mm-support#/?intcmp=nav-mm-support">Support</a></div>
    <!--
		<wsApp:UserAccess ID="useraccess1" runat="server" IsSecure="False" />
		-->
    <div class="spacer1"></div>
    <br />
    <!-- New Navigation DIV -->
    <div class="TL_nav" style="text-align: left;">
      <table cellspacing="0" class="toolBarTable" summary="">
        <!-- End New Navigation DIV -->
        <tr>
          <td>
            <!-- New Go To TOC -->
            <a href="toc.aspx"><img src="images/toc.png" alt="Go to the table of contents" border="0" /></a>
            <!-- End Go To TOC -->
          </td>
          <td>
            <!-- New Previous -->
            <a href="classifier%20details.aspx"><img src="images/prev.png" alt="Go to the previous page" border="0" /></a>
            <!-- End New Previous -->
          </td>
          <td>
            <!-- New Next (Active) -->
            <a href="Add%20Pattern.aspx"><img src="images/next.png" alt="Go to the next page" border="0" /></a>
            <!-- End New Next (Active) -->
          </td>
          <td>
            <!-- New PDF -->
            <a href="Data%20Security%208.3.pdf"><img src="images/pdf.png" alt="View or print as PDF" border="0" /></a>
            <!-- End New PDF -->
          </td>
          <!--Start JR breadcrumbs -->
          <td width="20px"></td>
          <td>
            <div class="WebWorks_Breadcrumbs" style="text-align: left;">
              <a class="WebWorks_Breadcrumb_Link" href="content%20classifiers.aspx">Classifying Content</a> &gt; Patterns &amp; Phrases</div>
          </td>
          <!--End JR breadcrumbs -->
        </tr>
      </table>
    </div>
    <!--googleon: all-->
    <div>
      <div class="N1H-Heading1"><a name="743205">Patterns &amp; Phrases</a></div>
      <div class="IN-TopicInfo"><a name="772856">Administrator Help | TRITON&nbsp;AP-DATA | Version 8.3.x</a></div>
      <table class="DropListTable" style="text-align: left" border="0" cellpadding="1" cellspacing="0" summary="">
        <caption></caption>
        <tr>
          <td style="padding-bottom: 3.5pt; padding-left: 6pt; padding-right: 6pt; padding-top: 4.5pt; vertical-align: top">
            <div class="DLC-ClosedDynamicList" onclick="WebWorks_ToggleDIV(WebWorksRootPath, &quot;wwdd743208&quot;);"><a name="743208">Related topics:</a><script type="text/javascript" language="JavaScript1.2">WebWorks_WriteArrow(WebWorksRootPath, "wwdd743208", false);</script></div>
            <script type="text/javascript" language="JavaScript1.2">WebWorks_WriteDIVOpen("wwdd743208", false);</script>
            <div class="B1-Bullet1_outer" style="margin-left: 0pt">
              <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
                <tr style="vertical-align: baseline">
                  <td>
                    <div class="B1-Bullet1_inner" style="width: 18pt; white-space: nowrap">
                      <img src="b1.png" alt="*" border="0" width="8" height="8" />
                    </div>
                  </td>
                  <td width="100%">
                    <div class="B1-Bullet1_inner"><span class="LEM-LinkEmphasis"><a href="Add%20Pattern.aspx" title="Adding or editing a regular expression classifier" name="743212">Adding or editing a regular expression classifier</a></span></div>
                  </td>
                </tr>
              </table>
            </div>
            <div class="B1-Bullet1_outer" style="margin-left: 0pt">
              <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
                <tr style="vertical-align: baseline">
                  <td>
                    <div class="B1-Bullet1_inner" style="width: 18pt; white-space: nowrap">
                      <img src="b1.png" alt="*" border="0" width="8" height="8" />
                    </div>
                  </td>
                  <td width="100%">
                    <div class="B1-Bullet1_inner"><span class="LEM-LinkEmphasis"><a href="add%20key%20phrase.aspx" title="Adding a key phrase classifier" name="743216">Adding a key phrase classifier</a></span></div>
                  </td>
                </tr>
              </table>
            </div>
            <div class="B1-Bullet1_outer" style="margin-left: 0pt">
              <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
                <tr style="vertical-align: baseline">
                  <td>
                    <div class="B1-Bullet1_inner" style="width: 18pt; white-space: nowrap">
                      <img src="b1.png" alt="*" border="0" width="8" height="8" />
                    </div>
                  </td>
                  <td width="100%">
                    <div class="B1-Bullet1_inner"><span class="LEM-LinkEmphasis"><a href="add%20lexicon.aspx" title="Adding a dictionary classifier" name="743220">Adding a dictionary classifier</a></span></div>
                  </td>
                </tr>
              </table>
            </div>
            <div class="B1-Bullet1_outer" style="margin-left: 0pt">
              <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
                <tr style="vertical-align: baseline">
                  <td>
                    <div class="B1-Bullet1_inner" style="width: 18pt; white-space: nowrap">
                      <img src="b1.png" alt="*" border="0" width="8" height="8" />
                    </div>
                  </td>
                  <td width="100%">
                    <div class="B1-Bullet1_inner"><span class="LEM-LinkEmphasis"><a href="File%20types.aspx" title="File properties" name="743225">File properties</a></span></div>
                  </td>
                </tr>
              </table>
            </div>
            <script type="text/javascript" language="JavaScript1.2">WebWorks_WriteDIVClose();</script>
          </td>
        </tr>
      </table>
      <div class="B-Body"><a name="601459">To view or manage a list of content classifiers based on patterns:</a></div>
      <div class="S-Step_outer" style="margin-left: 0pt">
        <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
          <tr style="vertical-align: baseline">
            <td>
              <div class="S-Step_inner" style="width: 18pt; white-space: nowrap">1.	</div>
            </td>
            <td width="100%">
              <div class="S-Step_inner"><a name="601466">Click </a><span class="B-Bold">Main &gt; Policy Management &gt; Content Classifiers</span>.</div>
            </td>
          </tr>
        </table>
      </div>
      <div class="S-Step_outer" style="margin-left: 0pt">
        <table border="0" cellspacing="0" cellpadding="0" summary="" role="presentation">
          <tr style="vertical-align: baseline">
            <td>
              <div class="S-Step_inner" style="width: 18pt; white-space: nowrap">2.	</div>
            </td>
            <td width="100%">
              <div class="S-Step_inner"><a name="601460">Select </a><span class="B-Bold">Patterns &amp; Phrases</span>. Both user-defined and built-in patterns are shown. These are distinguished by the icons and the Type column. You can sort the list by this column. Refer to <span class="URL-URL"><a href="https://help.forcepoint.com/docs/data/v83/policy_classifier/predef%20classifiers.aspx" target="external_window">Predefined Classifiers</a></span> for details about each Pattern &amp; Phrase classifier. </div>
            </td>
          </tr>
        </table>
      </div>
      <div class="I-IndentedText"><a name="649449">Also shown are the existing dictionary and key phrase classifiers, if any.</a></div>
      <div class="B-Body"><a name="598017">Click </a><span class="B-Bold">New</span> to add a new regular expression, key phrase, or dictionary, <span class="B-Bold">Delete</span> to delete the selected classifier, or <span class="B-Bold">Where Used</span> to view where the classifier is used. The column, <span class="B-Bold">Used in a Policy</span>, indicates whether the classifier is used in a policy at all. </div>
      <div class="B-Body"><a name="837779">RegEx patterns are special text strings for describing search patterns that can be detected within content. (Content includes the body of the content as well as any attachments). You define the patterns to look for in content and you set the action to take when a pattern is found. </a></div>
      <div class="B-Body"><a name="598019">For example, the string "a\d+" matches all strings that start with the letter "a" and are followed by at least one digit, where "\d" represents any digit and "+" represents "at least one." When the extracted text from a transaction is scanned, TRITON&nbsp;AP-DATA uses regular expressions to find strings in the text that match patterns for confidential information. For example, this is a very basic regular expression for catching Visa credit card numbers: </a></div>
      <div class="CO-Code"><a name="598020">\b(4\d{3}[\-\\]\d{4}[\-\\]\d{4}[\-\\]\d{4})\b </a></div>
      <div class="B-Body"><a name="598021">Because a regular expression file contains many internal attributes, if it is improperly written it can create many false-positive incidents, slow down the system, and impede analysis. </a></div>
      <div class="B-Body"><a name="598023">One way of mitigating false positives in a pattern is to exclude certain values that falsely match it. When defining the classifier, you can define a </a><span class="EM-Emphasis">Pattern to exclude</span> listing words or phrases that are exceptions to the pattern rule (search for all Social Security numbers except these numbers that look like Social Security numbers but are not). </div>
      <div class="B-Body"><a name="598024">You can also add a </a><span class="EM-Emphasis">List of phrases to exclude </span>listing words or phrases that, when found in combination with the pattern, affect whether or not the content is considered suspicious. </div>
      <div class="B-Body"><a name="624641">Another way to mitigate false positives is to consider the pattern as suspicious only when some other pattern or set of words appear in the analyzed data. To do this, you create another content classifier (a pattern, dictionary or any other), and combine the 2 in the condition of your rule with an AND operator.</a></div>
      <div class="B-Body"><a name="624619">When creating a rule for your policy, you can specify how many instances (matches) of the pattern must be found before the content is considered suspicious enough for the action to be taken (for example, 2 Social Security numbers seems reasonable, but 4 is already suspect). You do this on the </a><span class="B-Bold">Condition</span> tab of the <span class="B-Bold">Rule Properties </span>sheet.</div>
      <div class="B-Body"><a name="598025">For each content transmission, the system tallies the number of instances in which the pattern was found in the content. </a></div>
      <div class="B-Body"><a name="598026">If the number of pattern matches is less than the number of matches set, the content is not considered suspicious and there is no further analysis. </a></div>
      <div class="B-Body"><a name="598027">If the number of pattern matches is equal to or greater than the number of matches set, the content triggers the action specified in the rule that uses this pattern. </a></div>
      <div class="B-Body"><a name="598028">Example: </a></div>
      <div class="B-Body"><a name="598029">The pattern is Social Security numbers and the number of matches is 4. The body of an email contains 3 Social Security numbers; the subject contains 2 Social Security numbers. Since there were 5 pattern matches, and this is greater than the number of set matches, the message triggers the action specified in the rule that uses this pattern. </a></div>
      <div class="N4H-Heading4"><a name="598030">When a pattern to exclude is added</a></div>
      <div class="B-Body"><a name="598031">You can define a list of exceptions to the pattern. This is a list of content that matches the pattern but should not be considered in the tally of pattern matches. For each content transmitted, the system tallies the number of instances in which the pattern was found in the content, and subtracts the number of pattern-matches that are included in the Exclude list and compares this final number with the number of matches set. </a></div>
      <div class="B-Body"><a name="782738">Example: </a></div>
      <div class="B-Body"><a name="601442">The pattern is Social Security numbers, the number of matches is 2, and the list of excluded patterns is: 111-11-1111, 222-22-2222, and 333 33 3333 (total of three in the excluded list). The email contains 7 Social Security numbers: 111-11-1111, 222-33-4444, 444-55-6666, 555-66-7777, 222-22-2222, 777888-9999, 333-33-3333. The number of pattern matches is 7, minus 3 excluded patterns that were found in the email, thus equal to 4. Since 4 is greater than the number of matches (2), the message triggers the action specified in the rule that uses this pattern. </a></div>
      <div class="N4H-Heading4"><a name="598035">When a list of phrases to exclude is added</a></div>
      <div class="B-Body"><a name="598036">You can add a String List that lists suspicious words to the patterns. When you do, for each content item transmitted, the action specified in the rule that uses this pattern is triggered only if the total number of pattern matches is above the number of matches and a word from the specified dictionary was found. If the number of matches is reached but no words from the dictionary are present, no further analysis is performed. </a></div>
      <div class="B-Body"><a name="598037">Example: </a></div>
      <div class="B-Body"><a name="598038">The pattern is Social Security numbers, the number of matches is 2, and the String List contains the phrases "Social Security" and "credit card." The distributed content contains 3 Social Security numbers: 111-22-3333, 222-33-4444, 444-55-6666, but none of the words were found. Since the number of found distributed content (3) is greater than the number of matches (2), but there were no dictionary words in the email, no action is taken. </a></div>
    </div>
    <!--googleoff: all-->
    <div class="library_search">
      <form class="support_search" action="/content/kb-search.aspx" method="get">
        <label></label>
        <label></label>
        <input type="text" name="q" value=" Search eSupport" onfocus="if (this.value == ' Search eSupport') {this.value = '';}" onblur="if (this.value == '') {this.value = ' Search eSupport';}"></input>
        <input type="submit" value=" "></input>
      </form>
    </div>
    <br class="clear" />
    <!-- New Navigation DIV -->
    <div class="TL_nav" style="text-align: left;">
      <table cellspacing="0" class="toolBarTable" summary="">
        <!-- End New Navigation DIV -->
        <tr>
          <td>
            <!-- New Go To TOC -->
            <a href="toc.aspx"><img src="images/toc.png" alt="Go to the table of contents" border="0" /></a>
            <!-- End Go To TOC -->
          </td>
          <td>
            <!-- New Previous -->
            <a href="classifier%20details.aspx"><img src="images/prev.png" alt="Go to the previous page" border="0" /></a>
            <!-- End New Previous -->
          </td>
          <td>
            <!-- New Next (Active) -->
            <a href="Add%20Pattern.aspx"><img src="images/next.png" alt="Go to the next page" border="0" /></a>
            <!-- End New Next (Active) -->
          </td>
          <td>
            <!-- New PDF -->
            <a href="Data%20Security%208.3.pdf"><img src="images/pdf.png" alt="View or print as PDF" border="0" /></a>
            <!-- End New PDF -->
          </td>
          <!--Start JR breadcrumbs -->
          <td width="20px"></td>
          <td>
            <div class="WebWorks_Breadcrumbs" style="text-align: left;">
              <a class="WebWorks_Breadcrumb_Link" href="content%20classifiers.aspx">Classifying Content</a> &gt; Patterns &amp; Phrases</div>
          </td>
          <!--End JR breadcrumbs -->
        </tr>
      </table>
    </div>
    <div class="extFooterContainer">
      <div class="extFooter">
        <div align="center">Copyright 2016 Forcepoint LLC. All rights reserved.</div>
      </div>
    </div>
    <SCRIPT>
   function getFileName() {
      //this gets the full url
      var url = document.location.href;
      //this removes the anchor at the end, if there is one
      url = url.substring(0, (url.indexOf("#") == -1) ? url.length : url.indexOf("#"));
      //this removes the query after the file name, if there is one
      url = url.substring(0, (url.indexOf("?") == -1) ? url.length : url.indexOf("?"));
      //this removes everything before the last slash in the path
      url = url.substring(url.lastIndexOf("/") + 1, url.length);
      //return
      return url;
   }

   var url = document.URL;
   var Docname = getFileName()
   s.pageName = "enu:support:technical library:datahelp83:" + Docname;
   s.prop1 = "enu:support";
   s.prop2 = "enu:support:technical library";
   s.channel = "support";
   // <!--
   s.server = "<%= System.Environment.MachineName %>";
   //--></SCRIPT>
    <script language="javascript1.1" type="text/javascript">
   /********Do Not alter below this line ***********/
   var s_code = s.t(); if (s_code) document.write(s_code)
   //--&gt;</script>
  </body>
  <!--"GENERALQUARTERSALLHANDSMANYOURSTATIONS"-->
</html>