Spaces:

giulio98
/

codebleu

Runtime error

App Files Community

giulio98 committed on Nov 7, 2022

Commit

fbda58e

1 Parent(s): facca0d

fix

Browse files

Files changed (27) hide show

.gitattributes +1 -0
__pycache__/bleu.cpython-37.pyc +0 -0
__pycache__/calc_code_bleu.cpython-37.pyc +0 -0
__pycache__/codebleu.cpython-37.pyc +0 -0
__pycache__/dataflow_match.cpython-37.pyc +0 -0
__pycache__/syntax_match.cpython-37.pyc +0 -0
__pycache__/utils.cpython-37.pyc +0 -0
__pycache__/weighted_ngram_match.cpython-37.pyc +0 -0
codebleu.py +0 -8
parser/tree-sitter-c-sharp +0 -1
parser/tree-sitter-cpp +0 -1
parser/tree-sitter-go +0 -1
parser/tree-sitter-java +0 -1
parser/tree-sitter-javascript +0 -1
parser/tree-sitter-php +0 -1
parser/tree-sitter-python +0 -1
parser/tree-sitter-ruby +0 -1
{parser → parsercode}/DFG.py +0 -0
{parser → parsercode}/__init__.py +0 -0
parsercode/__pycache__/DFG.cpython-37.pyc +0 -0
parsercode/__pycache__/__init__.cpython-37.pyc +0 -0
parsercode/__pycache__/utils.cpython-37.pyc +0 -0
{parser → parsercode}/build.py +0 -0
{parser → parsercode}/build.sh +0 -0
{parser → parsercode}/my-languages.so +0 -0
{parser → parsercode}/utils.py +0 -0
utils.py +105 -105

.gitattributes CHANGED Viewed

@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 parser/my-languages.so filter=lfs diff=lfs merge=lfs -text

 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 parser/my-languages.so filter=lfs diff=lfs merge=lfs -text
+parsercode/my-languages.so filter=lfs diff=lfs merge=lfs -text

__pycache__/bleu.cpython-37.pyc ADDED Viewed

Binary file (25.1 kB). View file

__pycache__/calc_code_bleu.cpython-37.pyc ADDED Viewed

Binary file (2.91 kB). View file

__pycache__/codebleu.cpython-37.pyc ADDED Viewed

Binary file (2.37 kB). View file

__pycache__/dataflow_match.cpython-37.pyc ADDED Viewed

Binary file (4.18 kB). View file

__pycache__/syntax_match.cpython-37.pyc ADDED Viewed

Binary file (2.13 kB). View file

__pycache__/utils.cpython-37.pyc ADDED Viewed

Binary file (3.34 kB). View file

__pycache__/weighted_ngram_match.cpython-37.pyc ADDED Viewed

Binary file (21.7 kB). View file

codebleu.py CHANGED Viewed

@@ -83,14 +83,6 @@ class CodeBLEU(evaluate.Metric):
             reference_urls=["http://path.to.reference.url/new_module"]
         )
-    def _download_and_prepare(self, dl_manager):
-      """Optional: download external resources useful to compute the scores"""
-      # TODO: Download external resources if needed
-      if self.config_name == "python":
-        Language.build_library('./parser/my-languages.so',['tree-sitter-python'])
-      elif self.config_name == "cpp":
-        Language.build_library('./parser/my-languages.so',['tree-sitter-cpp'])
     def _compute(self, predictions, references, language="python", alpha=0.25, beta=0.25, gamma=0.25, theta=0.25):

             reference_urls=["http://path.to.reference.url/new_module"]
         )
     def _compute(self, predictions, references, language="python", alpha=0.25, beta=0.25, gamma=0.25, theta=0.25):

parser/tree-sitter-c-sharp DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 5b60f99545fea00a33bbfae5be956f684c4c69e2

parser/tree-sitter-cpp DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 5ead1e26c6ab71919db0f1880c46a278a93bc5ea

parser/tree-sitter-go DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 05900faa3cdb5d2d8c8bd5e77ee698487e0a8611

parser/tree-sitter-java DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 09d650def6cdf7f479f4b78f595e9ef5b58ce31e

parser/tree-sitter-javascript DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 936d976a782e75395d9b1c8c7c7bf4ba6fe0d86b

parser/tree-sitter-php DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit ab2e72179ceb8bb0b249c8ac9162a148e911b3dc

parser/tree-sitter-python DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit b14614e2144b8f9ee54deed5a24f3c6f51f9ffa8

parser/tree-sitter-ruby DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit 252ca18be76b0918fb6b34c302292b6931876c25

{parser → parsercode}/DFG.py RENAMED Viewed

File without changes

{parser → parsercode}/__init__.py RENAMED Viewed

File without changes

parsercode/__pycache__/DFG.cpython-37.pyc ADDED Viewed

Binary file (33.9 kB). View file

parsercode/__pycache__/__init__.cpython-37.pyc ADDED Viewed

Binary file (437 Bytes). View file

parsercode/__pycache__/utils.cpython-37.pyc ADDED Viewed

Binary file (2.43 kB). View file

{parser → parsercode}/build.py RENAMED Viewed

File without changes

{parser → parsercode}/build.sh RENAMED Viewed

File without changes

{parser → parsercode}/my-languages.so RENAMED Viewed

File without changes

{parser → parsercode}/utils.py RENAMED Viewed

File without changes

utils.py CHANGED Viewed

@@ -1,106 +1,106 @@
-# Natural Language Toolkit: Utility functions
-#
-# Copyright (C) 2001-2020 NLTK Project
-# Author: Steven Bird <stevenbird1@gmail.com>
-# URL: <http://nltk.org/>
-# For license information, see LICENSE.TXT
-from itertools import chain
-def pad_sequence(
-    sequence,
-    n,
-    pad_left=False,
-    pad_right=False,
-    left_pad_symbol=None,
-    right_pad_symbol=None,
-):
-    """
-    Returns a padded sequence of items before ngram extraction.
-        >>> list(pad_sequence([1,2,3,4,5], 2, pad_left=True, pad_right=True, left_pad_symbol='<s>', right_pad_symbol='</s>'))
-        ['<s>', 1, 2, 3, 4, 5, '</s>']
-        >>> list(pad_sequence([1,2,3,4,5], 2, pad_left=True, left_pad_symbol='<s>'))
-        ['<s>', 1, 2, 3, 4, 5]
-        >>> list(pad_sequence([1,2,3,4,5], 2, pad_right=True, right_pad_symbol='</s>'))
-        [1, 2, 3, 4, 5, '</s>']
-    :param sequence: the source data to be padded
-    :type sequence: sequence or iter
-    :param n: the degree of the ngrams
-    :type n: int
-    :param pad_left: whether the ngrams should be left-padded
-    :type pad_left: bool
-    :param pad_right: whether the ngrams should be right-padded
-    :type pad_right: bool
-    :param left_pad_symbol: the symbol to use for left padding (default is None)
-    :type left_pad_symbol: any
-    :param right_pad_symbol: the symbol to use for right padding (default is None)
-    :type right_pad_symbol: any
-    :rtype: sequence or iter
-    """
-    sequence = iter(sequence)
-    if pad_left:
-        sequence = chain((left_pad_symbol,) * (n - 1), sequence)
-    if pad_right:
-        sequence = chain(sequence, (right_pad_symbol,) * (n - 1))
-    return sequence
-# add a flag to pad the sequence so we get peripheral ngrams?
-def ngrams(
-    sequence,
-    n,
-    pad_left=False,
-    pad_right=False,
-    left_pad_symbol=None,
-    right_pad_symbol=None,
-):
-    """
-    Return the ngrams generated from a sequence of items, as an iterator.
-    For example:
-        >>> from nltk.util import ngrams
-        >>> list(ngrams([1,2,3,4,5], 3))
-        [(1, 2, 3), (2, 3, 4), (3, 4, 5)]
-    Wrap with list for a list version of this function.  Set pad_left
-    or pad_right to true in order to get additional ngrams:
-        >>> list(ngrams([1,2,3,4,5], 2, pad_right=True))
-        [(1, 2), (2, 3), (3, 4), (4, 5), (5, None)]
-        >>> list(ngrams([1,2,3,4,5], 2, pad_right=True, right_pad_symbol='</s>'))
-        [(1, 2), (2, 3), (3, 4), (4, 5), (5, '</s>')]
-        >>> list(ngrams([1,2,3,4,5], 2, pad_left=True, left_pad_symbol='<s>'))
-        [('<s>', 1), (1, 2), (2, 3), (3, 4), (4, 5)]
-        >>> list(ngrams([1,2,3,4,5], 2, pad_left=True, pad_right=True, left_pad_symbol='<s>', right_pad_symbol='</s>'))
-        [('<s>', 1), (1, 2), (2, 3), (3, 4), (4, 5), (5, '</s>')]
-    :param sequence: the source data to be converted into ngrams
-    :type sequence: sequence or iter
-    :param n: the degree of the ngrams
-    :type n: int
-    :param pad_left: whether the ngrams should be left-padded
-    :type pad_left: bool
-    :param pad_right: whether the ngrams should be right-padded
-    :type pad_right: bool
-    :param left_pad_symbol: the symbol to use for left padding (default is None)
-    :type left_pad_symbol: any
-    :param right_pad_symbol: the symbol to use for right padding (default is None)
-    :type right_pad_symbol: any
-    :rtype: sequence or iter
-    """
-    sequence = pad_sequence(
-        sequence, n, pad_left, pad_right, left_pad_symbol, right_pad_symbol
-    )
-    history = []
-    while n > 1:
-        # PEP 479, prevent RuntimeError from being raised when StopIteration bubbles out of generator
-        try:
-            next_item = next(sequence)
-        except StopIteration:
-            # no more data, terminate the generator
-            return
-        history.append(next_item)
-        n -= 1
-    for item in sequence:
-        history.append(item)
-        yield tuple(history)
         del history[0]

+# Natural Language Toolkit: Utility functions
+#
+# Copyright (C) 2001-2020 NLTK Project
+# Author: Steven Bird <stevenbird1@gmail.com>
+# URL: <http://nltk.org/>
+# For license information, see LICENSE.TXT
+from itertools import chain
+def pad_sequence(
+    sequence,
+    n,
+    pad_left=False,
+    pad_right=False,
+    left_pad_symbol=None,
+    right_pad_symbol=None,
+):
+    """
+    Returns a padded sequence of items before ngram extraction.
+        >>> list(pad_sequence([1,2,3,4,5], 2, pad_left=True, pad_right=True, left_pad_symbol='<s>', right_pad_symbol='</s>'))
+        ['<s>', 1, 2, 3, 4, 5, '</s>']
+        >>> list(pad_sequence([1,2,3,4,5], 2, pad_left=True, left_pad_symbol='<s>'))
+        ['<s>', 1, 2, 3, 4, 5]
+        >>> list(pad_sequence([1,2,3,4,5], 2, pad_right=True, right_pad_symbol='</s>'))
+        [1, 2, 3, 4, 5, '</s>']
+    :param sequence: the source data to be padded
+    :type sequence: sequence or iter
+    :param n: the degree of the ngrams
+    :type n: int
+    :param pad_left: whether the ngrams should be left-padded
+    :type pad_left: bool
+    :param pad_right: whether the ngrams should be right-padded
+    :type pad_right: bool
+    :param left_pad_symbol: the symbol to use for left padding (default is None)
+    :type left_pad_symbol: any
+    :param right_pad_symbol: the symbol to use for right padding (default is None)
+    :type right_pad_symbol: any
+    :rtype: sequence or iter
+    """
+    sequence = iter(sequence)
+    if pad_left:
+        sequence = chain((left_pad_symbol,) * (n - 1), sequence)
+    if pad_right:
+        sequence = chain(sequence, (right_pad_symbol,) * (n - 1))
+    return sequence
+# add a flag to pad the sequence so we get peripheral ngrams?
+def ngrams(
+    sequence,
+    n,
+    pad_left=False,
+    pad_right=False,
+    left_pad_symbol=None,
+    right_pad_symbol=None,
+):
+    """
+    Return the ngrams generated from a sequence of items, as an iterator.
+    For example:
+        >>> from nltk.util import ngrams
+        >>> list(ngrams([1,2,3,4,5], 3))
+        [(1, 2, 3), (2, 3, 4), (3, 4, 5)]
+    Wrap with list for a list version of this function.  Set pad_left
+    or pad_right to true in order to get additional ngrams:
+        >>> list(ngrams([1,2,3,4,5], 2, pad_right=True))
+        [(1, 2), (2, 3), (3, 4), (4, 5), (5, None)]
+        >>> list(ngrams([1,2,3,4,5], 2, pad_right=True, right_pad_symbol='</s>'))
+        [(1, 2), (2, 3), (3, 4), (4, 5), (5, '</s>')]
+        >>> list(ngrams([1,2,3,4,5], 2, pad_left=True, left_pad_symbol='<s>'))
+        [('<s>', 1), (1, 2), (2, 3), (3, 4), (4, 5)]
+        >>> list(ngrams([1,2,3,4,5], 2, pad_left=True, pad_right=True, left_pad_symbol='<s>', right_pad_symbol='</s>'))
+        [('<s>', 1), (1, 2), (2, 3), (3, 4), (4, 5), (5, '</s>')]
+    :param sequence: the source data to be converted into ngrams
+    :type sequence: sequence or iter
+    :param n: the degree of the ngrams
+    :type n: int
+    :param pad_left: whether the ngrams should be left-padded
+    :type pad_left: bool
+    :param pad_right: whether the ngrams should be right-padded
+    :type pad_right: bool
+    :param left_pad_symbol: the symbol to use for left padding (default is None)
+    :type left_pad_symbol: any
+    :param right_pad_symbol: the symbol to use for right padding (default is None)
+    :type right_pad_symbol: any
+    :rtype: sequence or iter
+    """
+    sequence = pad_sequence(
+        sequence, n, pad_left, pad_right, left_pad_symbol, right_pad_symbol
+    )
+    history = []
+    while n > 1:
+        # PEP 479, prevent RuntimeError from being raised when StopIteration bubbles out of generator
+        try:
+            next_item = next(sequence)
+        except StopIteration:
+            # no more data, terminate the generator
+            return
+        history.append(next_item)
+        n -= 1
+    for item in sequence:
+        history.append(item)
+        yield tuple(history)
         del history[0]