More languages
Some test text!
More languages
Sample Ruby code for using PDFTron SDK to create Unicode text and embed composite fonts in PDF files. Learn more about our Ruby PDF Library.
Get Started Samples DownloadTo run this sample, get started with a free trial of Apryse SDK.
#---------------------------------------------------------------------------------------
# Copyright (c) 2001-2023 by Apryse Software Inc. All Rights Reserved.
# Consult LICENSE.txt regarding license information.
#---------------------------------------------------------------------------------------
require '../../../PDFNetC/Lib/PDFNetRuby'
include PDFNetRuby
require '../../LicenseKey/RUBY/LicenseKey'
$stdout.sync = true
# Relative path to the folder containing the test files.
$input_path = "../../TestFiles/"
$output_path = "../../TestFiles/Output/"
# This example illustrates how to create Unicode text and how to embed composite fonts.
#
# Note: This demo assumes that 'arialuni.ttf' is present in '/Samples/TestFiles'
# directory. Arial Unicode MS is about 24MB in size and it comes together with Windows and
# MS Office.
#
# For more information about Arial Unicode MS, please consult the following Microsoft Knowledge
# Base Article: WD2002: General Information About the Arial Unicode MS Font
# http://support.microsoft.com/support/kb/articles/q287/2/47.asp
#
# For more information consult:
# http://office.microsoft.com/search/results.aspx?Scope=DC&Query=font&CTT=6&Origin=EC010331121033
# http://www.microsoft.com/downloads/details.aspx?FamilyID=1F0303AE-F055-41DA-A086-A65F22CB5593
#
# In case you don't have access to Arial Unicode MS you can use cyberbit.ttf
# (http://ftp.netscape.com/pub/communicator/extras/fonts/windows/) instead.
def main()
PDFNet.Initialize(PDFTronLicense.Key)
doc = PDFDoc.new
eb = ElementBuilder.new
writer = ElementWriter.new
# Start a new page ------------------------------------
page = doc.PageCreate(Rect.new(0, 0, 612, 794))
writer.Begin(page) # begin writing to this page
# Embed and subset the font
font_program = $input_path + "ARIALUNI.TTF"
if not File.file?(font_program)
if ENV['OS'] == "Windows_NT"
font_program = "C:/Windows/Fonts/ARIALUNI.TTF"
puts "Note: Using ARIALUNI.TTF from C:/Windows/Fonts directory."
end
end
begin
fnt = Font.CreateCIDTrueTypeFont(doc.GetSDFDoc(), font_program, true, true)
rescue
end
if not fnt.nil?
puts "Note: using " + font_program + " for unshaped unicode text"
else
puts "Note: using system font substitution for unshaped unicode text"
fnt = Font.Create(doc.GetSDFDoc(), "Helvetica", "")
end
element = eb.CreateTextBegin(fnt, 1)
element.SetTextMatrix(10, 0, 0, 10, 50, 600)
element.GetGState.SetLeading(2) # Set the spacing between lines
writer.WriteElement(element)
# Hello World!
hello = ['H','e','l','l','o',' ','W','o','r','l','d','!']
writer.WriteElement(eb.CreateUnicodeTextRun(hello, hello.length))
writer.WriteElement(eb.CreateTextNewLine)
# Latin
latin = ['a', 'A', 'b', 'B', 'c', 'C', 'd', 'D', 0x45, 0x0046, 0x00C0,
0x00C1, 0x00C2, 0x0143, 0x0144, 0x0145, 0x0152, '1', '2' ]# etc.
writer.WriteElement(eb.CreateUnicodeTextRun(latin, latin.length))
writer.WriteElement(eb.CreateTextNewLine)
# Greek
greek = [0x039E, 0x039F, 0x03A0, 0x03A1,0x03A3, 0x03A6, 0x03A8, 0x03A9]
writer.WriteElement(eb.CreateUnicodeTextRun(greek, greek.length))
writer.WriteElement(eb.CreateTextNewLine)
# Cyrillic
cyrillic = [0x0409, 0x040A, 0x040B, 0x040C, 0x040E, 0x040F, 0x0410, 0x0411,
0x0412, 0x0413, 0x0414, 0x0415, 0x0416, 0x0417, 0x0418, 0x0419]
writer.WriteElement(eb.CreateUnicodeTextRun(cyrillic, cyrillic.length))
writer.WriteElement(eb.CreateTextNewLine)
# Hebrew
hebrew = [0x05D0, 0x05D1, 0x05D3, 0x05D3, 0x05D4, 0x05D5, 0x05D6, 0x05D7, 0x05D8,
0x05D9, 0x05DA, 0x05DB, 0x05DC, 0x05DD, 0x05DE, 0x05DF, 0x05E0, 0x05E1]
writer.WriteElement(eb.CreateUnicodeTextRun(hebrew, hebrew.length))
writer.WriteElement(eb.CreateTextNewLine)
# Arabic
arabic = [0x0624, 0x0625, 0x0626, 0x0627, 0x0628, 0x0629, 0x062A, 0x062B, 0x062C,
0x062D, 0x062E, 0x062F, 0x0630, 0x0631, 0x0632, 0x0633, 0x0634, 0x0635]
writer.WriteElement(eb.CreateUnicodeTextRun(arabic, arabic.length))
writer.WriteElement(eb.CreateTextNewLine)
# Thai
thai = [0x0E01, 0x0E02, 0x0E03, 0x0E04, 0x0E05, 0x0E06, 0x0E07, 0x0E08, 0x0E09,
0x0E0A, 0x0E0B, 0x0E0C, 0x0E0D, 0x0E0E, 0x0E0F, 0x0E10, 0x0E11, 0x0E12]
writer.WriteElement(eb.CreateUnicodeTextRun(thai, thai.length))
writer.WriteElement(eb.CreateTextNewLine)
# Hiragana - Japanese
hiragana = [0x3041, 0x3042, 0x3043, 0x3044, 0x3045, 0x3046, 0x3047, 0x3048, 0x3049,
0x304A, 0x304B, 0x304C, 0x304D, 0x304E, 0x304F, 0x3051, 0x3051, 0x3052]
writer.WriteElement(eb.CreateUnicodeTextRun(hiragana, hiragana.length))
writer.WriteElement(eb.CreateTextNewLine)
# CJK Unified Ideographs
cjk_uni = [0x5841, 0x5842, 0x5843, 0x5844, 0x5845, 0x5846, 0x5847, 0x5848, 0x5849,
0x584A, 0x584B, 0x584C, 0x584D, 0x584E, 0x584F, 0x5850, 0x5851, 0x5852]
writer.WriteElement(eb.CreateUnicodeTextRun(cjk_uni, cjk_uni.length))
writer.WriteElement(eb.CreateTextNewLine)
# Simplified Chinese
chinese_simplified = [0x4e16, 0x754c, 0x60a8, 0x597d]
writer.WriteElement(eb.CreateUnicodeTextRun(chinese_simplified, chinese_simplified.length))
writer.WriteElement(eb.CreateTextNewLine)
puts "Now using text shaping logic to place text"
# Create a font in indexed encoding mode
# normally this would mean that we are required to provide glyph indices
# directly to CreateUnicodeTextRun, but instead, we will use the GetShapedText
# method to take care of this detail for us.
indexed_font = Font.CreateCIDTrueTypeFont(doc.GetSDFDoc(), $input_path + "NotoSans_with_hindi.ttf", true, true, Font::E_Indices)
element = eb.CreateTextBegin(indexed_font, 10)
writer.WriteElement(element)
line_pos = 350.0
line_space = 20.0
# Transform unicode text into an abstract collection of glyph indices and positioning info
shaped_text = indexed_font.GetShapedText("Shaped Hindi Text:")
# transform the shaped text info into a PDF element and write it to the page
element = eb.CreateShapedTextRun(shaped_text)
element.SetTextMatrix(1.5, 0, 0, 1.5, 50, line_pos)
writer.WriteElement(element)
# read in unicode text lines from a file
line_num=0
File.open($input_path +"hindi_sample_utf16le.txt", "rb:UTF-16LE").each do |line|
line_num += 1
end
puts "Read in %d lines of Unicode text from file" % line_num
i=0
File.open($input_path + "hindi_sample_utf16le.txt", "rb:UTF-16LE") do |f|
f.each_line do |line|
begin
shaped_text = indexed_font.GetShapedText(line[0..-2].encode('utf-8'))
element = eb.CreateShapedTextRun(shaped_text)
element.SetTextMatrix(1.5, 0, 0, 1.5, 50, line_pos-line_space*(i+1))
writer.WriteElement(element)
puts "Wrote shaped line to page"
i+=1
rescue
end
end
end
# Finish the block of text
writer.WriteElement(eb.CreateTextEnd())
# Finish the block of text
writer.WriteElement(eb.CreateTextEnd)
writer.End # save changes to the current page
doc.PagePushBack(page)
doc.Save($output_path + "unicodewrite.pdf", SDFDoc::E_remove_unused | SDFDoc::E_hex_strings)
puts "Done. Result saved in unicodewrite.pdf..."
doc.Close
PDFNet.Terminate
end
main()