View Javadoc
1   /*
2    * Copyright (c) 2002-2019, Mairie de Paris
3    * All rights reserved.
4    *
5    * Redistribution and use in source and binary forms, with or without
6    * modification, are permitted provided that the following conditions
7    * are met:
8    *
9    *  1. Redistributions of source code must retain the above copyright notice
10   *     and the following disclaimer.
11   *
12   *  2. Redistributions in binary form must reproduce the above copyright notice
13   *     and the following disclaimer in the documentation and/or other materials
14   *     provided with the distribution.
15   *
16   *  3. Neither the name of 'Mairie de Paris' nor 'Lutece' nor the names of its
17   *     contributors may be used to endorse or promote products derived from
18   *     this software without specific prior written permission.
19   *
20   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
21   * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22   * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23   * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS OR CONTRIBUTORS BE
24   * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25   * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26   * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27   * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28   * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30   * POSSIBILITY OF SUCH DAMAGE.
31   *
32   * License 1.0
33   */
34  
35  package fr.paris.lutece.nlptools;
36  
37  import java.util.ArrayList;
38  import java.util.List;
39  import java.util.regex.Matcher;
40  import java.util.regex.Pattern;
41  
42  /**
43   * EmailFinder
44   */
45  public class EmailFinder extends AbstractFinder
46  {
47      private static final Pattern MAIL_REGEX = Pattern.compile( "[-_.0-9A-Za-z]+@[-_0-9A-Za-z]+[-_.0-9A-Za-z]+" );
48  
49      /**
50       * Constructor
51       */
52      public EmailFinder( )
53      {
54          super( );
55      }
56  
57      /**
58       * Constructor
59       * 
60       * @param strReplacement
61       *            Replacement string
62       */
63      public EmailFinder( String strReplacement )
64      {
65          super( strReplacement );
66      }
67  
68      /**
69       * {@inheritDoc }
70       */
71      @Override
72      public List<String> findOccurrences( String strInputText ) throws FinderException
73      {
74          List<String> listOccurrences = new ArrayList<>( );
75          Matcher matcher = MAIL_REGEX.matcher( strInputText );
76          while ( matcher.find( ) )
77          {
78              String strEntity = matcher.group( );
79              listOccurrences.add( strEntity );
80              addEntity( strEntity );
81          }
82          return listOccurrences;
83      }
84  
85      /**
86       * {@inheritDoc }
87       */
88      @Override
89      public String replaceOccurrences( String strInputText ) throws FinderException
90      {
91          return replaceOccurrences( strInputText, getReplacement( ) );
92      }
93  
94      /**
95       * {@inheritDoc }
96       */
97      @Override
98      public String replaceOccurrences( String strInputText, String strReplacement ) throws FinderException
99      {
100         return MAIL_REGEX.matcher( strInputText ).replaceAll( strReplacement );
101     }
102 
103 }