File: genlengthsorted.rb

package info (click to toggle)
genometools 1.6.1%2Bds-3
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 50,412 kB
  • sloc: ansic: 271,241; ruby: 30,339; python: 4,880; sh: 3,193; makefile: 1,194; perl: 219; pascal: 159; haskell: 37; sed: 5
file content (48 lines) | stat: -rwxr-xr-x 1,020 bytes parent folder | download | duplicates (9)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
#!/usr/bin/env ruby

# generate random DNA sequence of approx. the given totallength, such that the
# sequence are ordered according to their length, with the shortest sequences
# coming first. Stefan Kurtz, September 2012

if ARGV.length != 1
  STDERR.puts "Usage: #{$0} <totallength>"
  exit 1
end

srand=37739292920

def randseq(width,len)
  seq = ""
  currentwidth=0
  0.upto(len-1) do |idx|
    r = rand(3)
    cc = ['a','c','g','t'][rand(4)]
    seq += "#{cc}"
    if currentwidth < width
      currentwidth+=1
    else
      seq += "\n"
      currentwidth=0
    end
  end
  return seq.chomp
end

totallength = ARGV[0].to_i
currentlen = 100
currentseqnum = 0
seqnumofthislength = 1 + rand(10)
sumlen = 0
seqnum = 0
while sumlen < totallength
  puts ">sequence #{seqnum} of length #{currentlen}\n#{randseq(70,currentlen)}"
  seqnum+=1
  sumlen += currentlen
  if currentseqnum < seqnumofthislength
    currentseqnum+=1
  else
    currentseqnum=0
    seqnumofthislength = 1 + rand(10)
    currentlen += 43
  end
end