1

我编写了一个程序,在一个包含许多有效和无效电子邮件的文本文件中查找有效的电子邮件地址。

& 然后在另一个文本文件中输出有效的电子邮件。

我遇到的问题是创建一个子字符串或对象,它将读取@符号左侧的行,如果有多个“。”,则读取为真。

例如:将这行文本作为有效的电子邮件阅读 - Jimmy.Cole@yahoo.com

&

如果有更多的“。” @ 符号后读为假。这是我的代码:

#include<iostream>
#include<string>
#include<fstream>
using namespace std;
const string DEFAULT_INPUT_FILENAME="fileContainingEmails.txt";
const string DEFAULT_OUTPUT_FILENAME="copyPasteMyEmails.txt";
const int N=1000;   //assuming atmost 1000 email 

//function prototypes
bool isNotDuplicateEmail(string emails[], int emailCount, string emailTemp);
bool isValidEmail(string emails[], string emailTemp);
void WriteToFile(string emails[], int emailCount, string outputFile);
void DisplayEmailsToConsole(string emails[], int emailCount);
bool isValidEmailChar(char c);
int countOccurenceOfAt(string emailTemp);
int countOccurenceOfDot(string emailTemp);

int main()
{
    //variable declaration
    ifstream fin;
    string inputFile;
    string outputFile;
    int emailCount=0;
    string emails[N];


    //ask user for input and output file name
    cout<<"Enter input file name: ";
    getline(cin,inputFile);
    cout<<"Enter output file name: ";
    getline(cin,outputFile);

    //check for default names
    if(inputFile=="")
        inputFile=DEFAULT_INPUT_FILENAME;
    if(outputFile=="")
        outputFile=DEFAULT_OUTPUT_FILENAME;

    cout<<"Input File Name = "<<inputFile<<endl;
    cout<<"Output File Name = "<<outputFile<<endl;

    //open input file
    fin.open(inputFile.c_str());
    //if file does not exists, display error message and return
    if(!fin)
    {
        cout<<"ERROR: "<<inputFile<<" doen not exists."<<endl;
        return 1;
    }

    string emailTemp;
    /*read each line from file, and if it is not a duplicate email and a valid email
    then add it to email list and increment count*/
    while(getline(fin,emailTemp))
    {
        if(isNotDuplicateEmail(emails,emailCount,emailTemp) && isValidEmail(emails,emailTemp))
        {
            emails[emailCount]=emailTemp;
            emailCount++;
        }
    }
    //close input file
    fin.close();

    //call function to write emails to output file and console
    if(emailCount>0)
    {
        WriteToFile(emails, emailCount, outputFile);
        cout << endl << emailCount << " email addresses were found, and copied to the file " << outputFile<<endl;
        DisplayEmailsToConsole(emails, emailCount);
    }
    else
    {
        cout << "Sorry, no email addresses were found in the file " << inputFile << endl;
    }


    cout << endl<< "Press ENTER to continue..." << endl;
    cin.get();
    return 0;
}

bool isNotDuplicateEmail(string emails[], int emailCount, string emailTemp)
{
    /*Check each email address and if a duplicate email is found, return false*/
    /*If email is not a duplicate email, return true*/
    for(int i=0;i<emailCount;i++)
    {
        if(emailTemp==emails[i])
            return false;
    }
    return true;
}
bool isValidEmail(string emails[], string emailTemp)
{
    if(emailTemp=="")
        return false;
    /*If there are more than 1 @*/
    if (countOccurenceOfAt(emailTemp)!=1)
        return false;
    /*If there are more than 1 .*/
    if(countOccurenceOfDot(emailTemp)!=1)
        return false;


    int index1=-1;
    int index2=-1;


    //check each character for valid email char
    for (int i=0; i<emailTemp.size(); i++)
    {
        if(!isValidEmailChar(emailTemp[i]))
            return false;
    }

    //find index of @ and .
    index1=emailTemp.find_first_of('@');
    index2=emailTemp.find_first_of('.');

    if(index1<1)
        return false;
    if(index2<index1)
        return false;
    if((index2-index1)==1)
        return false;

    if(((emailTemp.size()-1)-index2)==0)
        return false;

    return true;
}

bool isValidEmailChar(char c)
{
    /* check for valid email characters 0-9, @, ., A-Z, a-z, _, +, - */
    if(c>='0' && c<='9')
        return true;
    if(c>='A' && c<='Z')
        return true;
    if(c>='a' && c<='z')
        return true;
    if(c=='@' || c=='.' || c=='_' || c=='+' || c=='-')
        return true;

    return false;

}

/*Function to count occurence of @ in email address*/
int countOccurenceOfAt(string emailTemp)
{
    int count=0;
    for(int i=0;i<emailTemp.size();i++)
    {
        if(emailTemp[i]=='@')
            count++;
    }
    return count;
}

/*Function to count occurence of . in email address*/
int countOccurenceOfDot(string emailTemp)
{
    int count=0;
    for(int i=0;i<emailTemp.size();i++)
    {
        if(emailTemp[i]=='.')
            count++;
    }
    return count;
}

void DisplayEmailsToConsole(string emails[], int emailCount)
{
    /*Display console message and then display each email address, one at a line*/
    cout << endl << endl << "You can open the output file and copy/paste its contents into the \"to\", \"cc\", or \"bcc\" field of any email message. It is best to use the \"bcc\" field so that everyone's email address does not appear in the message, to protect their privacy"<<endl;
    cout << endl << "Email List is: "<< endl;
    for (int i=0; i<emailCount; i++)
    {
        cout << emails[i] << endl;
        cout << endl;
    }
}

void WriteToFile(string emails[], int emailCount, string outputFile)
{
    /*Open file and write each email address to output file followed by ; */
    ofstream fout;
    fout.open(outputFile.c_str());
    for(int i=0; i<emailCount; i++)
    {
        fout << emails[i] << "; " << endl;
    }
    //close file
    fout.close();
}
4

3 回答 3

1

以下代码来自《Secure Programming Cookbook for C and C++ 》一书:

#include <string.h>

int spc_email_isvalid(const char *address) {
  int        count = 0;
  const char *c, *domain;
  static char *rfc822_specials = "()<>@,;:\\\"[]";

  /* first we validate the name portion (name@domain) */
  for (c = address;  *c;  c++) {
    if (*c == '\"' && (c == address || *(c - 1) == '.' || *(c - 1) == 
        '\"')) {
      while (*++c) {
        if (*c == '\"') break;
        if (*c == '\\' && (*++c == ' ')) continue;
        if (*c <= ' ' || *c >= 127) return 0;
      }
      if (!*c++) return 0;
      if (*c == '@') break;
      if (*c != '.') return 0;
      continue;
    }
    if (*c == '@') break;
    if (*c <= ' ' || *c >= 127) return 0;
    if (strchr(rfc822_specials, *c)) return 0;
  }
  if (c == address || *(c - 1) == '.') return 0;

  /* next we validate the domain portion (name@domain) */
  if (!*(domain = ++c)) return 0;
  do {
    if (*c == '.') {
      if (c == domain || *(c - 1) == '.') return 0;
      count++;
    }
    if (*c <= ' ' || *c >= 127) return 0;
    if (strchr(rfc822_specials, *c)) return 0;
  } while (*++c);

  return (count >= 1);
}
于 2012-07-23T18:04:10.973 回答
1

如果您只需要知道 @ 符号之前是否有多个句点,那么只需执行以下操作:

if (email.find_first_of('.') == email.find_last_of('.'))

如果该表达式返回 true,那么您知道该字符串只有一个句点(或没有句点)。

于 2012-07-23T18:11:50.503 回答
1

看看这个链接: http: //www.codeproject.com/Articles/22777/Email-Address-Validation-Using-Regular-Expression

您可以使用正则表达式来处理具有更好性能的模式匹配。

于 2012-07-23T18:05:59.633 回答