glob(3f) - [fpm_strings:COMPARE] compare given string for match to
pattern which may contain wildcard characters
(LICENSE:PD)
logical function glob(string, pattern )
character(len=*),intent(in) :: string
character(len=*),intent(in) :: pattern
glob(3f) compares given STRING for match to PATTERN which may contain wildcard characters.
In this version to get a match the entire string must be described by PATTERN. Trailing whitespace is significant, so trim the input string to have trailing whitespace ignored.
string the input string to test for a match against the entire pattern.
pattern the following simple globbing options are available
o "?" matching any one character
o "*" matching zero or more characters.
Do NOT use adjacent asterisks.
o Trailing spaces in either string are significant;
trim() them first if they should be ignored.
o There is no escape character, so matching strings with
literal question mark and asterisk is problematic.
Example program
program demo_glob
implicit none
! Demonstration and self-test driver for glob(3f).
!
! Passes a collection of (string, pattern, expected result) triples to
! glob(3f) via the internal function test() and reports an overall
! "Passed"/"Failed" verdict. With nReps == 1 every individual case is
! echoed; with a larger nReps the per-case messages are suppressed so the
! loop can be used for rough timing comparisons.
!
! NOTE: the cases are chained with ".and.". Fortran does not require the
! second operand to be evaluated once allpassed is .false., so cases that
! follow a failure may be skipped by the compiler.
!
integer :: nReps      ! number of passes over the whole test set
logical :: allpassed  ! .true. while every case so far has met expectations
integer :: i
   allpassed = .true.
   ! Can choose as many repetitions as you're expecting
   ! in the real world (e.g. 10000 for timing runs).
   nReps = 1
   do i=1,nReps
      ! Cases with repeating character sequences.
      allpassed=allpassed .and. test("a*abab", "a*b", .true.)
      !!cycle
      allpassed=allpassed .and. test("ab", "*?", .true.)
      allpassed=allpassed .and. test("abc", "*?", .true.)
      allpassed=allpassed .and. test("abcccd", "*ccd", .true.)
      allpassed=allpassed .and. test("bLah", "bLaH", .false.)
      allpassed=allpassed .and. test("mississippi", "*sip*", .true.)
      allpassed=allpassed .and. &
       & test("xxxx*zzzzzzzzy*f", "xxx*zzy*f", .true.)
      allpassed=allpassed .and. &
       & test("xxxx*zzzzzzzzy*f", "xxxx*zzy*fffff", .false.)
      allpassed=allpassed .and. &
       & test("mississipissippi", "*issip*ss*", .true.)
      allpassed=allpassed .and. &
       & test("xxxxzzzzzzzzyf", "xxxx*zzy*fffff", .false.)
      allpassed=allpassed .and. &
       & test("xxxxzzzzzzzzyf", "xxxx*zzy*f", .true.)
      allpassed=allpassed .and. test("xyxyxyzyxyz", "xy*z*xyz", .true.)
      allpassed=allpassed .and. test("xyxyxyxyz", "xy*xyz", .true.)
      allpassed=allpassed .and. test("mississippi", "mi*sip*", .true.)
      allpassed=allpassed .and. test("ababac", "*abac*", .true.)
      allpassed=allpassed .and. test("aaazz", "a*zz*", .true.)
      allpassed=allpassed .and. test("a12b12", "*12*23", .false.)
      allpassed=allpassed .and. test("a12b12", "a12b", .false.)
      allpassed=allpassed .and. test("a12b12", "*12*12*", .true.)
      ! Additional cases where the '*' char appears in the tame string.
      allpassed=allpassed .and. test("*", "*", .true.)
      allpassed=allpassed .and. test("a*r", "a*", .true.)
      allpassed=allpassed .and. test("a*ar", "a*aar", .false.)
      ! More double wildcard scenarios.
      allpassed=allpassed .and. test("XYXYXYZYXYz", "XY*Z*XYz", .true.)
      allpassed=allpassed .and. test("missisSIPpi", "*SIP*", .true.)
      allpassed=allpassed .and. test("mississipPI", "*issip*PI", .true.)
      allpassed=allpassed .and. test("xyxyxyxyz", "xy*xyz", .true.)
      allpassed=allpassed .and. test("miSsissippi", "mi*sip*", .true.)
      allpassed=allpassed .and. test("miSsissippi", "mi*Sip*", .false.)
      allpassed=allpassed .and. test("abAbac", "*Abac*", .true.)
      allpassed=allpassed .and. test("aAazz", "a*zz*", .true.)
      allpassed=allpassed .and. test("A12b12", "*12*23", .false.)
      allpassed=allpassed .and. test("a12B12", "*12*12*", .true.)
      allpassed=allpassed .and. test("oWn", "*oWn*", .true.)
      ! Completely tame (no wildcards) cases.
      allpassed=allpassed .and. test("bLah", "bLah", .true.)
      ! Simple mixed wildcard tests suggested by IBMer Marlin Deckert.
      allpassed=allpassed .and. test("a", "*?", .true.)
      ! More mixed wildcard tests including coverage for false positives.
      allpassed=allpassed .and. test("a", "??", .false.)
      allpassed=allpassed .and. test("ab", "?*?", .true.)
      allpassed=allpassed .and. test("ab", "*?*?*", .true.)
      allpassed=allpassed .and. test("abc", "?**?*?", .true.)
      allpassed=allpassed .and. test("abc", "?**?*&?", .false.)
      allpassed=allpassed .and. test("abcd", "?b*??", .true.)
      allpassed=allpassed .and. test("abcd", "?a*??", .false.)
      allpassed=allpassed .and. test("abcd", "?**?c?", .true.)
      allpassed=allpassed .and. test("abcd", "?**?d?", .false.)
      allpassed=allpassed .and. test("abcde", "?*b*?*d*?", .true.)
      ! Single-character-match cases.
      allpassed=allpassed .and. test("bLah", "bL?h", .true.)
      allpassed=allpassed .and. test("bLaaa", "bLa?", .false.)
      allpassed=allpassed .and. test("bLah", "bLa?", .true.)
      allpassed=allpassed .and. test("bLaH", "?Lah", .false.)
      allpassed=allpassed .and. test("bLaH", "?LaH", .true.)
      ! Many-wildcard scenarios.
      allpassed=allpassed .and. test(&
      &"aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa&
      &aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaab",&
      &"a*a*a*a*a*a*aa*aaa*a*a*b",&
      &.true.)
      allpassed=allpassed .and. test(&
      &"abababababababababababababababababababaacacacacacacac&
      &adaeafagahaiajakalaaaaaaaaaaaaaaaaaffafagaagggagaaaaaaaab",&
      &"*a*b*ba*ca*a*aa*aaa*fa*ga*b*",&
      &.true.)
      allpassed=allpassed .and. test(&
      &"abababababababababababababababababababaacacacacacaca&
      &cadaeafagahaiajakalaaaaaaaaaaaaaaaaaffafagaagggagaaaaaaaab",&
      &"*a*b*ba*ca*a*x*aaa*fa*ga*b*",&
      &.false.)
      allpassed=allpassed .and. test(&
      &"abababababababababababababababababababaacacacacacacacad&
      &aeafagahaiajakalaaaaaaaaaaaaaaaaaffafagaagggagaaaaaaaab",&
      &"*a*b*ba*ca*aaaa*fa*ga*gggg*b*",&
      &.false.)
      allpassed=allpassed .and. test(&
      &"abababababababababababababababababababaacacacacacacacad&
      &aeafagahaiajakalaaaaaaaaaaaaaaaaaffafagaagggagaaaaaaaab",&
      &"*a*b*ba*ca*aaaa*fa*ga*ggg*b*",&
      &.true.)
      allpassed=allpassed .and. test("aaabbaabbaab", "*aabbaa*a*", .true.)
      allpassed=allpassed .and. &
      test("a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*",&
      &"a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*", .true.)
      allpassed=allpassed .and. test("aaaaaaaaaaaaaaaaa",&
      &"*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*", .true.)
      allpassed=allpassed .and. test("aaaaaaaaaaaaaaaa",&
      &"*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*a*", .false.)
      allpassed=allpassed .and. test(&
      &"abc*abcd*abcde*abcdef*abcdefg*abcdefgh*abcdefghi*abcdefghij&
      &*abcdefghijk*abcdefghijkl*abcdefghijklm*abcdefghijklmn",&
      & "abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc&
      &*abc*abc*abc*",&
      &.false.)
      allpassed=allpassed .and. test(&
      &"abc*abcd*abcde*abcdef*abcdefg*abcdefgh*abcdefghi*abcdefghij&
      &*abcdefghijk*abcdefghijkl*abcdefghijklm*abcdefghijklmn",&
      &"abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*",&
      &.true.)
      allpassed=allpassed .and. test("abc*abcd*abcd*abc*abcd",&
      &"abc*abc*abc*abc*abc", .false.)
      allpassed=allpassed .and. test( "abc*abcd*abcd*abc*abcd*abcd&
      &*abc*abcd*abc*abc*abcd", &
      &"abc*abc*abc*abc*abc*abc*abc*abc*abc*abc*abcd",&
      &.true.)
      allpassed=allpassed .and. test("abc",&
      &"********a********b********c********", .true.)
      allpassed=allpassed .and.&
      &test("********a********b********c********", "abc", .false.)
      allpassed=allpassed .and. &
      &test("abc", "********a********b********b********", .false.)
      allpassed=allpassed .and. test("*abc*", "***a*b*c***", .true.)
      ! A case-insensitive algorithm test.
      ! allpassed=allpassed .and. test("mississippi", "*issip*PI", .true.)
   enddo
   if (allpassed)then
      ! nReps is an integer, so it needs its own integer edit descriptor;
      ! a lone '(a)' format is not valid for a non-character item.
      write(*,'(a,1x,i0)')"Passed",nReps
   else
      write(*,'(a)')"Failed"
   endif
contains
   ! This is a test program for wildcard matching routines.
   ! It can be used either to test a single routine for correctness,
   ! or to compare the timings of two (or more) different wildcard
   ! matching routines.
   !
   ! test() calls glob(tame, wild) once and returns .true. when the result
   ! agrees with bExpectedResult. A separator line is always printed; the
   ! per-case "Passed"/"Failed" message is printed only when the host
   ! variable nReps is 1.
   function test(tame, wild, bExpectedResult) result(bpassed)
   use fpm_strings, only : glob
   character(len=*), intent(in) :: tame             ! string to be matched
   character(len=*), intent(in) :: wild             ! pattern, may contain '*' and '?'
   logical, intent(in)          :: bExpectedResult  ! what glob() should return
   logical :: bResult
   logical :: bPassed
      bPassed = .false. ! Assume the worst.
      write(*,*)repeat('=',79)
      bResult = glob(tame, wild) ! Call a wildcard matching routine.
      ! To assist correctness checking, output the two strings in any
      ! failing scenarios.
      if (bExpectedResult .eqv. bResult) then
         bPassed = .true.
         if(nReps == 1) write(*,*)"Passed match on ",tame," vs. ", wild
      else
         if(nReps == 1) write(*,*)"Failed match on ",tame," vs. ", wild
      endif
   end function test
end program demo_glob
Expected output
The article “Matching Wildcards: An Empirical Way to Tame an Algorithm” in Dr Dobb’s Journal, By Kirk J. Krauss, October 07, 2014
| Type | Intent | Optional | Attributes | Name | Description |
|---|---|---|---|---|---|
| character(len=*) | | | | tame | A string without wildcards to compare to the globbing expression |
| character(len=*) | | | | wild | A (potentially) corresponding string with wildcards |

Return value: logical, result of test
function glob(tame,wild)
! @(#)fpm_strings::glob(3f): function compares text strings, one of which can have wildcards ('*' or '?').
!
! Returns .true. when the whole of TAME is described by WILD, where a '*'
! in WILD matches zero or more characters and a '?' matches exactly one
! character. There is no escape character. Blanks are ordinary characters,
! so trailing blanks in either argument take part in the comparison.
!
! Both arguments are copied into local buffers terminated by char(0); the
! terminator marks "end of text" for the two cursors TI and WI, so an
! embedded char(0) in either argument is treated as the end of that text.
!
! The end-of-TAME test is made at the top of every pass of the main loop
! so that neither cursor is ever advanced beyond its terminator (this also
! makes a zero-length TAME safe).
logical                      :: glob       !! result of test
character(len=*),intent(in)  :: tame       !! A string without wildcards to compare to the globbing expression
character(len=*),intent(in)  :: wild       !! A (potentially) corresponding string with wildcards
character(len=len(tame)+1)   :: tametext   ! working copy of TAME, char(0)-terminated
character(len=len(wild)+1)   :: wildtext   ! working copy of WILD, char(0)-terminated
character(len=1),parameter   :: NULL=char(0)
integer                      :: ti, wi     ! cursors into tametext and wildtext
character(len=:),allocatable :: tbookmark, wbookmark
! These two values are set when we observe a wildcard character. They
! represent the locations, in the two strings, from which we start once we've observed it.
   tametext=tame//NULL
   wildtext=wild//NULL
   tbookmark = NULL                ! a lone NULL means "no bookmark set yet"
   wbookmark = NULL
   wi=1
   ti=1
   do                                            ! Walk the text strings one character at a time.
      if (tametext(ti:ti)==NULL) then            ! How do you match a tame text string?
         do while (wildtext(wi:wi) == '*')       ! The tame way: unique up on it!
            wi=wi+1                              ! "x" matches "x*"
         enddo
         ! TAME is used up: it is a match only if nothing but (skipped)
         ! asterisks remained in the pattern.
         glob = wildtext(wi:wi)==NULL            ! "x" matches "x", "x" doesn't match "xy"
         return
      endif
      if(wildtext(wi:wi) == '*')then             ! How do you match a unique text string?
         do while (wildtext(wi:wi)=='*')         ! Easy: unique up on it!
            wi=wi+1                              ! (the terminator stops the scan)
         enddo
         if(wildtext(wi:wi)==NULL) then          ! "x" matches "*"
            glob=.true.
            return
         endif
         if(wildtext(wi:wi) /= '?') then
            ! Fast-forward to next possible match.
            do while (tametext(ti:ti) /= wildtext(wi:wi))
               ti=ti+1
               if (tametext(ti:ti)==NULL)then
                  glob=.false.
                  return                         ! "x" doesn't match "*y*"
               endif
            enddo
         endif
         ! Remember where the text after the asterisk starts in both strings.
         wbookmark = wildtext(wi:)
         tbookmark = tametext(ti:)
      elseif(tametext(ti:ti) /= wildtext(wi:wi) .and. wildtext(wi:wi) /= '?') then
         ! Got a non-match. If we've set our bookmarks, back up to one or both of them and retry.
         if(wbookmark/=NULL) then
            if(wildtext(wi:)/= wbookmark) then
               ! Rewind the pattern to just after the last asterisk. The
               ! assignment blank-pads after the terminator; those blanks
               ! are never examined.
               wildtext = wbookmark
               wi=1
               ! Don't go this far back again.
               if (tametext(ti:ti) /= wildtext(wi:wi)) then
                  tbookmark=tbookmark(2:)
                  tametext = tbookmark
                  ti=1
                  cycle                          ! "xy" matches "*y"
               else
                  wi=wi+1
               endif
            endif
            if (tametext(ti:ti)/=NULL) then
               ti=ti+1
               cycle                             ! "mississippi" matches "*sip*"
            endif
         endif
         glob=.false.
         return                                  ! "xy" doesn't match "x"
      endif
      ! Current characters agree (or the pattern has '?'): step both cursors.
      ti=ti+1
      wi=wi+1
   enddo
end function glob