pendar02 committed on
Commit
737cac5
·
verified ·
1 Parent(s): b6f12ab

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -2
app.py CHANGED
@@ -104,8 +104,13 @@ def validate_excel_structure(df):
104
  validation_messages.append("Invalid format in Publication Year column")
105
 
106
  # Check if DOIs are in valid format (basic check)
107
- if not df['DOI'].str.contains(r'10\.\d{4,}/.+', na=True).all():
108
- validation_messages.append("Some DOIs are in invalid format")
 
 
 
 
 
109
 
110
  return len(validation_messages) == 0, validation_messages
111
 
 
104
  validation_messages.append("Invalid format in Publication Year column")
105
 
106
  # Check if DOIs are in valid format (basic check)
107
+ try:
108
+ # Convert DOI column to string and handle NaN values
109
+ doi_series = df['DOI'].fillna('')
110
+ if not doi_series.astype(str).str.contains(r'10\.\d{4,}/.+', na=True).all():
111
+ validation_messages.append("Some DOIs are in invalid format or missing")
112
+ except Exception as e:
113
+ validation_messages.append(f"Error validating DOI format: {str(e)}")
114
 
115
  return len(validation_messages) == 0, validation_messages
116