Reputation: 21
I have written a program that looks for valid email addresses in a text file that has many emails both valid & invalid.
& then outputs the vaild emails in another text file.
The problem i have is creating a substring or object that will read the line left of the @ symbol & read true if there are multiple '.'
for example: read this line of text as a valid email - [email protected]
&
if there are more '.' after the @ symbol read as false. here is my code:
#include<iostream>
#include<string>
#include<fstream>
using namespace std;
const string DEFAULT_INPUT_FILENAME="fileContainingEmails.txt";
const string DEFAULT_OUTPUT_FILENAME="copyPasteMyEmails.txt";
const int N=1000; //assuming atmost 1000 email
//function prototypes
bool isNotDuplicateEmail(string emails[], int emailCount, string emailTemp);
bool isValidEmail(string emails[], string emailTemp);
void WriteToFile(string emails[], int emailCount, string outputFile);
void DisplayEmailsToConsole(string emails[], int emailCount);
bool isValidEmailChar(char c);
int countOccurenceOfAt(string emailTemp);
int countOccurenceOfDot(string emailTemp);
int main()
{
//variable declaration
ifstream fin;
string inputFile;
string outputFile;
int emailCount=0;
string emails[N];
//ask user for input and output file name
cout<<"Enter input file name: ";
getline(cin,inputFile);
cout<<"Enter output file name: ";
getline(cin,outputFile);
//check for default names
if(inputFile=="")
inputFile=DEFAULT_INPUT_FILENAME;
if(outputFile=="")
outputFile=DEFAULT_OUTPUT_FILENAME;
cout<<"Input File Name = "<<inputFile<<endl;
cout<<"Output File Name = "<<outputFile<<endl;
//open input file
fin.open(inputFile.c_str());
//if file does not exists, display error message and return
if(!fin)
{
cout<<"ERROR: "<<inputFile<<" doen not exists."<<endl;
return 1;
}
string emailTemp;
/*read each line from file, and if it is not a duplicate email and a valid email
then add it to email list and increment count*/
while(getline(fin,emailTemp))
{
if(isNotDuplicateEmail(emails,emailCount,emailTemp) && isValidEmail(emails,emailTemp))
{
emails[emailCount]=emailTemp;
emailCount++;
}
}
//close input file
fin.close();
//call function to write emails to output file and console
if(emailCount>0)
{
WriteToFile(emails, emailCount, outputFile);
cout << endl << emailCount << " email addresses were found, and copied to the file " << outputFile<<endl;
DisplayEmailsToConsole(emails, emailCount);
}
else
{
cout << "Sorry, no email addresses were found in the file " << inputFile << endl;
}
cout << endl<< "Press ENTER to continue..." << endl;
cin.get();
return 0;
}
bool isNotDuplicateEmail(string emails[], int emailCount, string emailTemp)
{
/*Check each email address and if a duplicate email is found, return false*/
/*If email is not a duplicate email, return true*/
for(int i=0;i<emailCount;i++)
{
if(emailTemp==emails[i])
return false;
}
return true;
}
bool isValidEmail(string emails[], string emailTemp)
{
if(emailTemp=="")
return false;
/*If there are more than 1 @*/
if (countOccurenceOfAt(emailTemp)!=1)
return false;
/*If there are more than 1 .*/
if(countOccurenceOfDot(emailTemp)!=1)
return false;
int index1=-1;
int index2=-1;
//check each character for valid email char
for (int i=0; i<emailTemp.size(); i++)
{
if(!isValidEmailChar(emailTemp[i]))
return false;
}
//find index of @ and .
index1=emailTemp.find_first_of('@');
index2=emailTemp.find_first_of('.');
if(index1<1)
return false;
if(index2<index1)
return false;
if((index2-index1)==1)
return false;
if(((emailTemp.size()-1)-index2)==0)
return false;
return true;
}
bool isValidEmailChar(char c)
{
/* check for valid email characters 0-9, @, ., A-Z, a-z, _, +, - */
if(c>='0' && c<='9')
return true;
if(c>='A' && c<='Z')
return true;
if(c>='a' && c<='z')
return true;
if(c=='@' || c=='.' || c=='_' || c=='+' || c=='-')
return true;
return false;
}
/*Function to count occurence of @ in email address*/
int countOccurenceOfAt(string emailTemp)
{
int count=0;
for(int i=0;i<emailTemp.size();i++)
{
if(emailTemp[i]=='@')
count++;
}
return count;
}
/*Function to count occurence of . in email address*/
int countOccurenceOfDot(string emailTemp)
{
int count=0;
for(int i=0;i<emailTemp.size();i++)
{
if(emailTemp[i]=='.')
count++;
}
return count;
}
void DisplayEmailsToConsole(string emails[], int emailCount)
{
/*Display console message and then display each email address, one at a line*/
cout << endl << endl << "You can open the output file and copy/paste its contents into the \"to\", \"cc\", or \"bcc\" field of any email message. It is best to use the \"bcc\" field so that everyone's email address does not appear in the message, to protect their privacy"<<endl;
cout << endl << "Email List is: "<< endl;
for (int i=0; i<emailCount; i++)
{
cout << emails[i] << endl;
cout << endl;
}
}
void WriteToFile(string emails[], int emailCount, string outputFile)
{
/*Open file and write each email address to output file followed by ; */
ofstream fout;
fout.open(outputFile.c_str());
for(int i=0; i<emailCount; i++)
{
fout << emails[i] << "; " << endl;
}
//close file
fout.close();
}
Upvotes: 1
Views: 1998
Reputation: 405
If all you need to know is if there are multiple periods before the @ symbol, then just do:
if (email.find_first_of('.') == email.find_last_of('.'))
If that expression returns true, then you know that the string has only one period (or none).
Upvotes: 1
Reputation: 389
Take a look at this link: http://www.codeproject.com/Articles/22777/Email-Address-Validation-Using-Regular-Expression
You can use regular expressions to take care of pattern matching with much better performance.
Upvotes: 1
Reputation: 97948
Following code is from the book Secure Programming Cookbook for C and C++:
#include <string.h>
int spc_email_isvalid(const char *address) {
int count = 0;
const char *c, *domain;
static char *rfc822_specials = "()<>@,;:\\\"[]";
/* first we validate the name portion (name@domain) */
for (c = address; *c; c++) {
if (*c == '\"' && (c == address || *(c - 1) == '.' || *(c - 1) ==
'\"')) {
while (*++c) {
if (*c == '\"') break;
if (*c == '\\' && (*++c == ' ')) continue;
if (*c <= ' ' || *c >= 127) return 0;
}
if (!*c++) return 0;
if (*c == '@') break;
if (*c != '.') return 0;
continue;
}
if (*c == '@') break;
if (*c <= ' ' || *c >= 127) return 0;
if (strchr(rfc822_specials, *c)) return 0;
}
if (c == address || *(c - 1) == '.') return 0;
/* next we validate the domain portion (name@domain) */
if (!*(domain = ++c)) return 0;
do {
if (*c == '.') {
if (c == domain || *(c - 1) == '.') return 0;
count++;
}
if (*c <= ' ' || *c >= 127) return 0;
if (strchr(rfc822_specials, *c)) return 0;
} while (*++c);
return (count >= 1);
}
Upvotes: 1