bash를 사용하여 열에서 세 개 이상 연속되는 항목을 하나로 묶기

Question 1

awk를 사용한 해결책:

# Print "first-last letters" for each run of three or more consecutive numbers; NR>1 keeps a leading 1 from being chained to the unset p, and END flushes a run that reaches the last line.
awk 'function out(){ if(c>1) printf "%s-%s %s\n", b, p, s } {if(NR>1 && p+1==$1){c+=1}else{ out(); c=0;s=""}} c==1{b=p} {p=$1;s=s$2} END{out()}' file

이번에는 설명을 덧붙여 더 읽기 쉽게 작성했습니다:

awk '
# Print the collected run, but only if it spans three or more lines
# (c counts consecutive steps, so c > 1 means at least three values).
function out() {
  if (c > 1) {
    # print the begin and end values with the concatenated string
    printf "%s-%s %s\n", b, p, s
  }
}
{
  # NR > 1: p is still unset on the first line, so without this guard a
  # leading "1" would look like the continuation of a run
  if (NR > 1 && p + 1 == $1) {
    c += 1 # increment the counter if the value is consecutive
  } else {
    out()
    c = 0  # reset the counter
    s = "" # reset the string to print
  }
}
c == 1 { b = p } # set the begin value
{ p = $1; s = s $2 } # set the previous variable and the string for the next loop
END { out() } # flush a run that reaches the end of the input
' file

GNU awk와 mawk로 테스트했습니다.

Answer

awk를 사용한 해결책:

# Print "first-last letters" for each run of three or more consecutive numbers; NR>1 keeps a leading 1 from being chained to the unset p, and END flushes a run that reaches the last line.
awk 'function out(){ if(c>1) printf "%s-%s %s\n", b, p, s } {if(NR>1 && p+1==$1){c+=1}else{ out(); c=0;s=""}} c==1{b=p} {p=$1;s=s$2} END{out()}' file

이번에는 설명을 덧붙여 더 읽기 쉽게 작성했습니다:

awk '
# Print the collected run, but only if it spans three or more lines
# (c counts consecutive steps, so c > 1 means at least three values).
function out() {
  if (c > 1) {
    # print the begin and end values with the concatenated string
    printf "%s-%s %s\n", b, p, s
  }
}
{
  # NR > 1: p is still unset on the first line, so without this guard a
  # leading "1" would look like the continuation of a run
  if (NR > 1 && p + 1 == $1) {
    c += 1 # increment the counter if the value is consecutive
  } else {
    out()
    c = 0  # reset the counter
    s = "" # reset the string to print
  }
}
c == 1 { b = p } # set the begin value
{ p = $1; s = s $2 } # set the previous variable and the string for the next loop
END { out() } # flush a run that reaches the end of the input
' file

GNU awk와 mawk로 테스트했습니다.

Question 2

awk 사용:

$ awk 'function out() { if (start != "") { if (start == prev) printf("%s\t%s\n", prev, string); else printf("%s-%s\t%s\n", start, prev, string) } } NR == 1 || $1 != prev + 1 { out(); start = $1; string = "" } { prev = $1; string = string $2 } END { out() }' file
14      R
16      I
21-24   BCQE
33-34   RL
41      K
62-64   FFM
88      B

awk 프로그램:

# Print the run collected so far: "N<TAB>letters" for a single number,
# "first-last<TAB>letters" for a longer run. Does nothing before the
# first run has been started.
function out() {
    if (start != "") {
        if (start == prev)
            printf("%s\t%s\n", prev, string)
        else
            printf("%s-%s\t%s\n", start, prev, string)
    }
}

# A new run begins on the first record and whenever the number does not
# directly follow the previous one. The explicit NR == 1 matters when the
# input starts with 1: prev is still unset there, so prev + 1 is also 1,
# the run would never get a start value and out() would drop it.
NR == 1 || $1 != prev + 1 { out(); start = $1; string = "" }

# Every record extends the current run.
{ prev = $1; string = string $2 }

# Flush the last run.
END { out() }

이 프로그램은 첫 번째 열의 이전 숫자를 prev에, 두 번째 열 값들을 이어 붙인 문자열을 string에 기록합니다. 이전 첫 번째 열 값이 현재 첫 번째 열 값보다 1 작으면 prev와 string만 갱신됩니다.

번호에 "공백"(건너뛴 구간)이 있으면, 수집된 데이터를 기록된 구간과 함께 출력하기 위해 out()이 호출됩니다. 이 함수는 입력이 끝날 때에도 호출됩니다.

이를 sh 셸 코드로 그대로 옮기면 다음과 같습니다:

# Emit the run gathered so far from the globals start, prev and string:
# "N<TAB>letters" for a single number, "first-last<TAB>letters" otherwise.
# Prints nothing while start is still empty.
out () {
    [ -n "$start" ] || return 0

    case $start in
        "$prev") printf '%s\t%s\n' "$prev" "$string" ;;
        *)       printf '%s-%s\t%s\n' "$start" "$prev" "$string" ;;
    esac
}

# Read "number letters" pairs from file and merge consecutive numbers into
# runs; out prints each finished run.
# The extra [ -n "$num" ] test keeps a last line that lacks a trailing newline.
while read -r num str || [ -n "$num" ]; do
    # Start a new run on the first line (start is still empty) or when the
    # number does not directly follow the previous one. Without the first
    # test, an input beginning with 1 is mistaken for a continuation of the
    # unset prev (0 + 1) and that first run is never printed.
    if [ -z "$start" ] || [ "$num" -ne "$(( prev + 1 ))" ]; then
        out
        start=$num
        string=""
    fi

    prev=$num
    string=$string$str
done <file

# Flush the last run.
out

방금 숫자상으로 서로 이어지는 행이 두 개만 있어도 이것이 결합된다는 것을 알았습니다. 나중에 수정할 수도 있지만 지금은 여기에 그대로 두겠습니다.

Answer