Remove And Blackout Email and SSN Data From PDF - C#
PDF Search and Delete Text from PDF sample in C# demonstrating ‘Remove And Blackout Email and SSN Data From PDF’
Program.cs
using System;
using System.IO;
using System.Net;
using Newtonsoft.Json.Linq;
using System.Threading;
using System.Collections.Generic;
using Newtonsoft.Json;
// Cloud API asynchronous "Delete Text from PDF" job example.
namespace ByteScoutWebApiExample
{
class Program
{
// The authentication key (API Key).
// Get your own by registering at https://app.pdf.co
const String API_KEY = "YOUR_PDFco_API_KEY_HERE";
// Source PDF file
const string SourceFile = @".\sample.pdf";
// PDF document password. Leave empty for unprotected documents.
const string Password = "";
// Regex Enabled Search
const bool RegexEnabled = true;
// Destination PDF file name
const string DestinationFile = @".\result.pdf";
static void Main(string[] args)
{
// Upload file to the cloud
string uploadedFileUrl = UploadFile(SourceFile);
if (string.IsNullOrEmpty(uploadedFileUrl))
{
Console.WriteLine("File upload error.");
return;
}
// Regular Expression to Search for SSN
string regex_ssn = @"[0-9]{3}-[0-9]{2}-[0-9]{4}";
// Regular Expression to Search Email Address
string regex_email = @"[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,6}";
// Create standard .NET web client instance
WebClient webClient = new WebClient();
// Set API Key
webClient.Headers.Add("x-api-key", API_KEY);
// Prepare requests params as JSON
// See documentation: https://apidocs.pdf.co/#pdf-search-and-delete-text-from-pdf
Dictionary<string, object> parameters = new Dictionary<string, object>();
parameters.Add("name", Path.GetFileName(DestinationFile));
parameters.Add("password", Password);
parameters.Add("url", uploadedFileUrl);
parameters.Add("searchStrings", new string[] { regex_ssn, regex_email });
parameters.Add("regex", RegexEnabled);
// Important: Specify Blackout Color
parameters.Add("profiles", @"{'UsePatch': true, 'PatchColor': '#000000'}");
parameters.Add("async", true); // ! Making Async request
// Convert dictionary of params to JSON
string jsonPayload = JsonConvert.SerializeObject(parameters);
// URL of `Delete Text from PDF` API call
string url = "https://api.pdf.co/v1/pdf/edit/delete-text";
try
{
// Execute POST request with JSON payload
string response = webClient.UploadString(url, jsonPayload);
// Parse JSON response
JObject json = JObject.Parse(response);
if (json["error"].ToObject<bool>() == false)
{
// Asynchronous job ID
string jobId = json["jobId"].ToString();
// URL of generated PDF file that will available after the job completion
string resultFileUrl = json["url"].ToString();
// Check the job status in a loop.
// If you don't want to pause the main thread you can rework the code
// to use a separate thread for the status checking and completion.
do
{
string status = CheckJobStatus(jobId); // Possible statuses: "working", "failed", "aborted", "success".
// Display timestamp and status (for demo purposes)
Console.WriteLine(DateTime.Now.ToLongTimeString() + ": " + status);
if (status == "success")
{
// Download PDF file
webClient.DownloadFile(resultFileUrl, DestinationFile);
Console.WriteLine("Generated PDF file saved as \"{0}\" file.", DestinationFile);
break;
}
else if (status == "working")
{
// Pause for a few seconds
Thread.Sleep(3000);
}
else
{
Console.WriteLine(status);
break;
}
}
while (true);
}
else
{
Console.WriteLine(json["message"].ToString());
}
}
catch (WebException e)
{
Console.WriteLine(e.ToString());
}
webClient.Dispose();
Console.WriteLine();
Console.WriteLine("Press any key...");
Console.ReadKey();
}
/// <summary>
/// Uploads file to the cloud and return URL of uploaded file to use in further API calls.
/// </summary>
/// <param name="file">Source file name (path).</param>
/// <returns>URL of uploaded file</returns>
static string UploadFile(string file)
{
// Create standard .NET web client instance
WebClient webClient = new WebClient();
// Set API Key
webClient.Headers.Add("x-api-key", API_KEY);
try
{
// 1. RETRIEVE THE PRESIGNED URL TO UPLOAD THE FILE.
// * If you already have a direct file URL, skip to the step 3.
// Prepare URL for `Get Presigned URL` API call
string query = Uri.EscapeUriString(string.Format(
"https://api.pdf.co/v1/file/upload/get-presigned-url?contenttype=application/octet-stream&name={0}",
Path.GetFileName(file)));
// Execute request
string response = webClient.DownloadString(query);
// Parse JSON response
JObject json = JObject.Parse(response);
if (json["error"].ToObject<bool>() == false)
{
// Get URL to use for the file upload
string uploadUrl = json["presignedUrl"].ToString();
// Get URL of uploaded file to use with later API calls
string uploadedFileUrl = json["url"].ToString();
// 2. UPLOAD THE FILE TO CLOUD.
webClient.Headers.Add("content-type", "application/octet-stream");
webClient.UploadFile(uploadUrl, "PUT", file); // You can use UploadData() instead if your file is in byte[] or Stream
return uploadedFileUrl;
}
else
{
// Display service reported error
Console.WriteLine(json["message"].ToString());
}
}
catch (Exception e)
{
Console.WriteLine(e);
throw;
}
finally
{
webClient.Dispose();
}
return null;
}
static string CheckJobStatus(string jobId)
{
using (WebClient webClient = new WebClient())
{
// Set API Key
webClient.Headers.Add("x-api-key", API_KEY);
string url = "https://api.pdf.co/v1/job/check?jobid=" + jobId;
string response = webClient.DownloadString(url);
JObject json = JObject.Parse(response);
return Convert.ToString(json["status"]);
}
}
}
}
PDF.co Web API: the Web API with a set of tools for documents manipulation, data conversion, data extraction, splitting and merging of documents. Includes image recognition, built-in OCR, barcode generation and barcode decoders to decode bar codes from scans, pictures and pdf.
Download Source Code (.zip)
return to the previous page explore PDF Search and Delete Text from PDF endpoint
Copyright © 2016 - 2024 PDF.co